diff --git a/.gitattributes b/.gitattributes index f5555e58818ec369c49d99e902cb8b768e32ec20..86a861a820f7108ce39f6eb66320bb5e8b9e3a06 100644 --- a/.gitattributes +++ b/.gitattributes @@ -34,3 +34,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text git.diff filter=lfs diff=lfs merge=lfs -text +replay.mp4 filter=lfs diff=lfs merge=lfs -text +sf_log.txt filter=lfs diff=lfs merge=lfs -text diff --git a/.summary/0/events.out.tfevents.1697546584.rhmmedcatt-proliant-ml350-gen10 b/.summary/0/events.out.tfevents.1697546584.rhmmedcatt-proliant-ml350-gen10 new file mode 100644 index 0000000000000000000000000000000000000000..5928047bdb3c8b1c797cb92578831b89a23473c2 --- /dev/null +++ b/.summary/0/events.out.tfevents.1697546584.rhmmedcatt-proliant-ml350-gen10 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca679b85b37b196bcd04a0962b3e12a82267fd1a90c56c57ef279d41ad96a4a0 +size 47071849 diff --git a/.summary/1/events.out.tfevents.1697546584.rhmmedcatt-proliant-ml350-gen10 b/.summary/1/events.out.tfevents.1697546584.rhmmedcatt-proliant-ml350-gen10 new file mode 100644 index 0000000000000000000000000000000000000000..338ffad1f1260eb65562718d77a3f142e777d1b2 --- /dev/null +++ b/.summary/1/events.out.tfevents.1697546584.rhmmedcatt-proliant-ml350-gen10 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e529c942378f50a418c3dd4d52a9f7cb3e7db405efe76c8d80a994d05771e9 +size 24889961 diff --git a/README.md b/README.md index 209ef88a52963e42c56e9fa4761d96184b404ced..48686c511586f091282ee240856f5ad1ff0d4811 100644 --- a/README.md +++ b/README.md @@ -15,7 +15,7 @@ model-index: type: atari_asteroid metrics: - type: mean_reward - value: 1218.00 +/- 462.14 + value: 225993.00 +/- 112245.84 name: mean_reward verified: false --- @@ -24,6 +24,7 @@ model-index: This project is an attempt to maximise performance of high sample throughput APPO RL models in Atari 
environments in as carbon efficient a manner as possible using a single, not particularly high performance single machine. It is about demonstrating the generalisability of on-policy algorithms to create good performance quickly (by sacrificing sample efficiency) while also proving that this route to RL production is accessible to even hobbyists like me (I am a gastroenterologist not a computer scientist). +With Sample Factory I am reaching throughputs of 2,500 - 3,000 across both policies on two Quadro P2200s (not particularly powerful GPUs), each loaded to about 60% (3GB). Previously, using the Stable Baselines3 (SB3) implementation of PPO, it would take about a week to train an Atari agent to 100 million timesteps synchronously. By comparison, the Sample Factory async implementation takes just over 2 hours to achieve the same result. That is about 84 times faster, typically with only a 21 watt burn per GPU. I am thus very grateful to Alex Petrenko and all the Sample Factory team for their work on this. 
## Project Aims diff --git a/checkpoint_p0/best_001117600_286105600_reward_1315.400.pth b/checkpoint_p0/best_001117600_286105600_reward_1315.400.pth new file mode 100644 index 0000000000000000000000000000000000000000..141f6919e9ba8423e97c67ea5a38d2ea6373b32a --- /dev/null +++ b/checkpoint_p0/best_001117600_286105600_reward_1315.400.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fa8c9ad092341acf8945c2edb2db0f6df9b82cfb7c12638c1e54d63f847aaa4 +size 20771187 diff --git a/checkpoint_p0/checkpoint_001145536_293257216.pth b/checkpoint_p0/checkpoint_001145536_293257216.pth new file mode 100644 index 0000000000000000000000000000000000000000..d221433150002d4a461acbdbf0edbea9a9d50689 --- /dev/null +++ b/checkpoint_p0/checkpoint_001145536_293257216.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90822f78d275766fcd5939a3c22fa700bbb01a9e8d106fc9980afc63b12acbb5 +size 20771651 diff --git a/checkpoint_p0/checkpoint_001146400_293478400.pth b/checkpoint_p0/checkpoint_001146400_293478400.pth new file mode 100644 index 0000000000000000000000000000000000000000..458845996d89e1458d63fa3d7cf2cd3c3ba16dbb --- /dev/null +++ b/checkpoint_p0/checkpoint_001146400_293478400.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5bef34215ef58e6e41a9984ea73e4e79a509eb7499b73bbd6fcd254b776c3d4 +size 20771651 diff --git a/checkpoint_p0/milestones/checkpoint_000017344_4440064.pth b/checkpoint_p0/milestones/checkpoint_000017344_4440064.pth new file mode 100644 index 0000000000000000000000000000000000000000..18f2c92e5834cc89427989ad747de26d384372a5 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000017344_4440064.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e101a2394d47e125bd7f2096783b784b614139d8cd08a9f03cf9322bcb94bdd +size 20772507 diff --git a/checkpoint_p0/milestones/checkpoint_000031424_8044544.pth b/checkpoint_p0/milestones/checkpoint_000031424_8044544.pth new file mode 
100644 index 0000000000000000000000000000000000000000..4431aa6ab238338529d6924fb674a45dc9a6fc33 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000031424_8044544.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7a0437495c34a5f9772784929973fdacd95a82a99f965c52992f7ff1e44c0e7 +size 20772507 diff --git a/checkpoint_p0/milestones/checkpoint_000045504_11649024.pth b/checkpoint_p0/milestones/checkpoint_000045504_11649024.pth new file mode 100644 index 0000000000000000000000000000000000000000..12d2fd73aff8a19ab2726ac56f4057218abb8d0a --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000045504_11649024.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6005e88615cfcf024f34edb92ead07024970a747e98a8c0252fdd0f48c9e1527 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000059648_15269888.pth b/checkpoint_p0/milestones/checkpoint_000059648_15269888.pth new file mode 100644 index 0000000000000000000000000000000000000000..cbe7326efcda9fb3a08ece83c985f0c7a0edbf73 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000059648_15269888.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:044a336b4fd5a63c184b40d0e87e1e4b68cf530bf93d3c0fff11850fd73a7b59 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000073696_18866176.pth b/checkpoint_p0/milestones/checkpoint_000073696_18866176.pth new file mode 100644 index 0000000000000000000000000000000000000000..4341521226952deefcddfcade656a0d506b0994c --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000073696_18866176.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce35bfc3bfc3645a2ad50c377ebcb69d5b391739498f3a4849406bd87d4342c8 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000087808_22478848.pth b/checkpoint_p0/milestones/checkpoint_000087808_22478848.pth new file mode 100644 index 0000000000000000000000000000000000000000..6dfcdf7a4151a5276c44d945f1666bd92d3be970 --- 
/dev/null +++ b/checkpoint_p0/milestones/checkpoint_000087808_22478848.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f2de14f7b2a0451f82f728c29ff19ee639a9660c4560f4213c6acdb9aeeb024 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000101952_26099712.pth b/checkpoint_p0/milestones/checkpoint_000101952_26099712.pth new file mode 100644 index 0000000000000000000000000000000000000000..2857c21f205b6f24a951705d594c3083c38f3b45 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000101952_26099712.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea933d8882803349f787e7ddca0bdfd26ad2823e2c0259ae012aefa568a120d3 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000116224_29753344.pth b/checkpoint_p0/milestones/checkpoint_000116224_29753344.pth new file mode 100644 index 0000000000000000000000000000000000000000..93adae421a18bdef1a736dd9a96bfd90136fea8b --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000116224_29753344.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb391a1069c5226abed3d57f3da0e177741be6b1c7bc34d40dc6af0810a58fc +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000130496_33406976.pth b/checkpoint_p0/milestones/checkpoint_000130496_33406976.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5e1c9cf302171461546da409ea1e2e33c1eb32e --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000130496_33406976.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37fdf618e00fc4877cc07957cd8e6ebeaf2b39755c267f5934589a12d629c2e7 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000144800_37068800.pth b/checkpoint_p0/milestones/checkpoint_000144800_37068800.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f40ea7ea86d6867ebc44d9db808cc5ed3926ea4 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000144800_37068800.pth @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:d8b644fd25a139e991b47ce7d0d7a21329af1f8d03a5d59c47733885fbd18676 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000159136_40738816.pth b/checkpoint_p0/milestones/checkpoint_000159136_40738816.pth new file mode 100644 index 0000000000000000000000000000000000000000..07c4d5740678be58b3ebcfd4e1ef5a203a45163c --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000159136_40738816.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b933e100ff4eb9a8a5171d459ddd5b62ba3e453a8cabfbe367b6dd0d2521120 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000173504_44417024.pth b/checkpoint_p0/milestones/checkpoint_000173504_44417024.pth new file mode 100644 index 0000000000000000000000000000000000000000..e374c86f77af031efa4464f25367c71fe91b5844 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000173504_44417024.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c5ebaed7b4997c5b56e708556f50c2addf0b28352d080e08f80d7dd563bab7 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000187872_48095232.pth b/checkpoint_p0/milestones/checkpoint_000187872_48095232.pth new file mode 100644 index 0000000000000000000000000000000000000000..f208218b76040939f4f17847f4d54ae49acc755b --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000187872_48095232.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8d004205f3cebc5752d0bd436223063dca95108e2e65291adbe96c00bd283d +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000202208_51765248.pth b/checkpoint_p0/milestones/checkpoint_000202208_51765248.pth new file mode 100644 index 0000000000000000000000000000000000000000..79b65314f22b4a953055fb2ff26168cdcb40a681 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000202208_51765248.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:abb40b8e1daa3793e525a2891ef69480a134c74fb72f98b1d8843594e9e636f0 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000216608_55451648.pth b/checkpoint_p0/milestones/checkpoint_000216608_55451648.pth new file mode 100644 index 0000000000000000000000000000000000000000..28188107159af77a6ffa076f9bfd92a40ce87a26 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000216608_55451648.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5945a45fea6a11cc3baf802f20e29ddb7dfdbc4c81202b92f1e2dc07f7d92c4b +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000230912_59113472.pth b/checkpoint_p0/milestones/checkpoint_000230912_59113472.pth new file mode 100644 index 0000000000000000000000000000000000000000..8b6b2415875b177295cfffd3fb3412c81ea969e5 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000230912_59113472.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb20a4336d3c595434f6740be33cc6933702e360a6e024aa7ce5ec8973b83b97 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000245248_62783488.pth b/checkpoint_p0/milestones/checkpoint_000245248_62783488.pth new file mode 100644 index 0000000000000000000000000000000000000000..b2383f60370616f2590c1d6b67b259ac4606cdb3 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000245248_62783488.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071327ab7a0624276b85454c0969903817d89ff157523ec5a77225bfb60fabce +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000259552_66445312.pth b/checkpoint_p0/milestones/checkpoint_000259552_66445312.pth new file mode 100644 index 0000000000000000000000000000000000000000..e5034e556d1d8903edd67ff3779c25e3a23d2e17 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000259552_66445312.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebcbf5053199bc8e75f4387b6d8d003f7e6d70b5c922ca473a49ed07d8d3124a +size 20772563 diff --git 
a/checkpoint_p0/milestones/checkpoint_000273856_70107136.pth b/checkpoint_p0/milestones/checkpoint_000273856_70107136.pth new file mode 100644 index 0000000000000000000000000000000000000000..100f9b0ed729db69e547b8aeec9c6e9352cf541e --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000273856_70107136.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1baae4a4ffbf2570774fb89048800e592dc275b7074009b44001f541c1c86819 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000288160_73768960.pth b/checkpoint_p0/milestones/checkpoint_000288160_73768960.pth new file mode 100644 index 0000000000000000000000000000000000000000..3fe580e0743f5ce840df8a79258a5303e41b718c --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000288160_73768960.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20b85d7cd7cdaab3111de30e600f1d09d35fe43a90dfa8e33409cdda591e1b3 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000302528_77447168.pth b/checkpoint_p0/milestones/checkpoint_000302528_77447168.pth new file mode 100644 index 0000000000000000000000000000000000000000..4f293ae0a75e7c2aecb31208a4fa70fcd7c9b342 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000302528_77447168.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f79222a5ec60fe41bc1d9216b7c6434ae2f3eb6ce9b53ff6ad6703b2543d10ac +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000316832_81108992.pth b/checkpoint_p0/milestones/checkpoint_000316832_81108992.pth new file mode 100644 index 0000000000000000000000000000000000000000..f1342061dc2e7667df6824a9b2818dd8a02a3e0c --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000316832_81108992.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c573c402b6c2f4a09d33c6cd0d4a862a62a0a8b830cb13de5e145526cc635ff1 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000331168_84779008.pth 
b/checkpoint_p0/milestones/checkpoint_000331168_84779008.pth new file mode 100644 index 0000000000000000000000000000000000000000..817c68bf2889b193d4d8b944b40bfabb337cb0b0 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000331168_84779008.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2a696955e14c6bc2350c260d49e0ce1e1ef2636ce9530deeff2b2d5e193a918 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000345408_88424448.pth b/checkpoint_p0/milestones/checkpoint_000345408_88424448.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a167ab3ce8c47f7cbe3349629dea6cd5b3ee508 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000345408_88424448.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7f7f39212335d9c6381adbc1ca4c7819d96916520518994f8e5b81c3787b88f +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000359776_92102656.pth b/checkpoint_p0/milestones/checkpoint_000359776_92102656.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a6afd1cb312c4e4fa2ee8d1a152df81258d278b --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000359776_92102656.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d79655a6da23a9c737bed5a5f909a0dd8b240555a48844bd874693c5b7b6b07f +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000374144_95780864.pth b/checkpoint_p0/milestones/checkpoint_000374144_95780864.pth new file mode 100644 index 0000000000000000000000000000000000000000..ff86e6503e95a7a0771f3547aa8ace5a1f4c2c04 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000374144_95780864.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a88cbd121b2b0fd808ff5baf58454b64d107021043d6087fa5df2f0cae41a5 +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000388544_99467264.pth b/checkpoint_p0/milestones/checkpoint_000388544_99467264.pth new file mode 100644 index 
0000000000000000000000000000000000000000..d5677f77170df6f703ae9e44a5d11483e94e0efa --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000388544_99467264.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1d9a824166d33ec5e3e928b5ee712b52a535167ee8750bca5d88946a3d52aec +size 20772563 diff --git a/checkpoint_p0/milestones/checkpoint_000402848_103129088.pth b/checkpoint_p0/milestones/checkpoint_000402848_103129088.pth new file mode 100644 index 0000000000000000000000000000000000000000..3905d23324fc31f336740500683fbf2c4ea5893d --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000402848_103129088.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffd67763646672873ec1d79b4746af6635ad3187c04a3fb62591b18efceceb78 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000417120_106782720.pth b/checkpoint_p0/milestones/checkpoint_000417120_106782720.pth new file mode 100644 index 0000000000000000000000000000000000000000..5cd37daa6023386ff5550b7117d8d1636874c2ee --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000417120_106782720.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1819c25cd923f4349956fc1a0cc1b70f2baf526226b332aa7fab8b53f377e3d8 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000431488_110460928.pth b/checkpoint_p0/milestones/checkpoint_000431488_110460928.pth new file mode 100644 index 0000000000000000000000000000000000000000..4727e174a8b0a6ca7f4d12f68609fb3a259e71d8 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000431488_110460928.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e215e2d8028277f28ad794dfbe2b4267d2cde27588d9e3dad329c631cba0cadc +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000445760_114114560.pth b/checkpoint_p0/milestones/checkpoint_000445760_114114560.pth new file mode 100644 index 0000000000000000000000000000000000000000..356ef9ee3331b6044755043039a75ecc155637d7 --- 
/dev/null +++ b/checkpoint_p0/milestones/checkpoint_000445760_114114560.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf8ca679b447e8fc6069488f4b4012b9f8c4787a2b30c63a3df425449b466c5 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000460128_117792768.pth b/checkpoint_p0/milestones/checkpoint_000460128_117792768.pth new file mode 100644 index 0000000000000000000000000000000000000000..b049a61f776b691f9d945ad7a1e2621715fec3e5 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000460128_117792768.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c84021872691c617e22658d38b5e8cb654c5ff54a325a07cea28e43f8dc5efc +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000474496_121470976.pth b/checkpoint_p0/milestones/checkpoint_000474496_121470976.pth new file mode 100644 index 0000000000000000000000000000000000000000..049fb3c3b91674266fcae934d57c531ec98b912b --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000474496_121470976.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4064e396f2ede028f14f292762d49043a89b0daa36787999be819a58b14a44fc +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000488832_125140992.pth b/checkpoint_p0/milestones/checkpoint_000488832_125140992.pth new file mode 100644 index 0000000000000000000000000000000000000000..db7091d04d98866e8981cbac95d08843dcd8ddcf --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000488832_125140992.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46db5cc970b768746e1441dd8734d1bd4425aa7a7969b0bf7f264c4fb036b95b +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000503136_128802816.pth b/checkpoint_p0/milestones/checkpoint_000503136_128802816.pth new file mode 100644 index 0000000000000000000000000000000000000000..39b5d8e8fa72c92da317c474fc5ad6ad8f4e5ebe --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000503136_128802816.pth @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:cbd0d003a672abc18f423a524731e74f5659e55252180d83041b876b4e02f9d9 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000517472_132472832.pth b/checkpoint_p0/milestones/checkpoint_000517472_132472832.pth new file mode 100644 index 0000000000000000000000000000000000000000..d7988938c9cd84019bb75ee2743f119e798806eb --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000517472_132472832.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:220438a8384c32c2a6874603198f89edc2eab0c9f5f66f53c0ce19ed9977cded +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000531744_136126464.pth b/checkpoint_p0/milestones/checkpoint_000531744_136126464.pth new file mode 100644 index 0000000000000000000000000000000000000000..910de03d8cfc76b58cc3a54ea63e33c487f75ee5 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000531744_136126464.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a10a92a045e32c291ca7f746f4d3c362a0acec8627222b18f619e4dbdf572b +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000546080_139796480.pth b/checkpoint_p0/milestones/checkpoint_000546080_139796480.pth new file mode 100644 index 0000000000000000000000000000000000000000..7b694fbf675826154d48e4785d31323ab59b341c --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000546080_139796480.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ac690b4ae75c5d1d6d3b9b4805feed6028f690c74b8c069140bbf69ecbacab9 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000560320_143441920.pth b/checkpoint_p0/milestones/checkpoint_000560320_143441920.pth new file mode 100644 index 0000000000000000000000000000000000000000..dea4737282a747bb7cad4faed10c58ea49c78093 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000560320_143441920.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:beb0529a780707f6ffd4de7dc81567b16f4aa31753561ddd922cfece980f1de5 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000574656_147111936.pth b/checkpoint_p0/milestones/checkpoint_000574656_147111936.pth new file mode 100644 index 0000000000000000000000000000000000000000..be74325a1366cff481fa2f14cdf6632bc86627b4 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000574656_147111936.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e0eef3825f235db75bf8c31c47637d91d5199f2aab23bc21b0540a0bd4cbd3 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000588960_150773760.pth b/checkpoint_p0/milestones/checkpoint_000588960_150773760.pth new file mode 100644 index 0000000000000000000000000000000000000000..84d5d0577e6f88278e498c2c9e4e681cccb7c84c --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000588960_150773760.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5d3c92f6416e33b04e98200eaa6eac3f61461c942a49a72ff5b9f7104cc7920 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000603232_154427392.pth b/checkpoint_p0/milestones/checkpoint_000603232_154427392.pth new file mode 100644 index 0000000000000000000000000000000000000000..5ebae64d7ce15a62ce8edf30f8e712a87fdb678d --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000603232_154427392.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eda89977159370337e7a0580e1891713a4cb80ba6e2234c58ce3af04d51a32f +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000617504_158081024.pth b/checkpoint_p0/milestones/checkpoint_000617504_158081024.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c761effb6000f88ccba8aaeab835a29beb6ae84 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000617504_158081024.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:354a74580251dc6bec99585805ebc1857da3dd1aa322f1088a4627191df990e4 +size 20772619 diff 
--git a/checkpoint_p0/milestones/checkpoint_000631808_161742848.pth b/checkpoint_p0/milestones/checkpoint_000631808_161742848.pth new file mode 100644 index 0000000000000000000000000000000000000000..be384e31c4b38465fda8b8107a8a8544db1f5ef0 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000631808_161742848.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83b027059ecb7a4e5a5d4494414ce771cb4d27d8e42d81a00b2eebf6a34f1459 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000646144_165412864.pth b/checkpoint_p0/milestones/checkpoint_000646144_165412864.pth new file mode 100644 index 0000000000000000000000000000000000000000..37ff8eec97ecabc242ca6cbac47e75780b9fe76d --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000646144_165412864.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50cc78b7d4c959f44705d7babd583c9521c7ef4115083a8eba9996228cea13cd +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000660576_169107456.pth b/checkpoint_p0/milestones/checkpoint_000660576_169107456.pth new file mode 100644 index 0000000000000000000000000000000000000000..0745007a1b6256d5f6f2d279b13574d3dbc5500b --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000660576_169107456.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ada935148397f57976d9a5096e125b0f32360873db338cca464070c8f36596b +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000674912_172777472.pth b/checkpoint_p0/milestones/checkpoint_000674912_172777472.pth new file mode 100644 index 0000000000000000000000000000000000000000..f4e5087cb96e8d7367ab40967c73a4ccc768da8c --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000674912_172777472.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6426f416ee6280adf065f54245eefd834e9ca9b2cb92d97f39a613972b388a +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000689248_176447488.pth 
b/checkpoint_p0/milestones/checkpoint_000689248_176447488.pth new file mode 100644 index 0000000000000000000000000000000000000000..f868a2e9984eb8a0a9dcff4f907bf6a1d071d1b3 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000689248_176447488.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5037c3b60b6f5a1f2f24d221937bca7d1d71ddf412470f90c4cf0107e4a93344 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000703616_180125696.pth b/checkpoint_p0/milestones/checkpoint_000703616_180125696.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e82ab842e3f043e870bfb472200bf62fd4f9bf2 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000703616_180125696.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a971c04bc30587c2ea055254eb3918b2eaad59aec5663c10587c02a21b755193 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000717984_183803904.pth b/checkpoint_p0/milestones/checkpoint_000717984_183803904.pth new file mode 100644 index 0000000000000000000000000000000000000000..39116d41b4d3acfecf4e11cc252d432c2b7691d8 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000717984_183803904.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:961803187b9d21b5a96309f29cf1a70a3cdc53b119d374c7796a9aa8fbcb6717 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000732320_187473920.pth b/checkpoint_p0/milestones/checkpoint_000732320_187473920.pth new file mode 100644 index 0000000000000000000000000000000000000000..9ee5785580b72ec32b5cffa217140d7fe83e3529 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000732320_187473920.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a41eee75021344c7dee01446c5cc3a49930b19db2e7252f51f43608af18b0b5 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000746624_191135744.pth b/checkpoint_p0/milestones/checkpoint_000746624_191135744.pth new file mode 100644 index 
0000000000000000000000000000000000000000..c53a062b2aa231f7c5e914dea6f854f960470828 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000746624_191135744.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:518f60b0717a4ff205526f71ae2a19c4aef8c627c3b439653e8219ab3eb4f1bb +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000760928_194797568.pth b/checkpoint_p0/milestones/checkpoint_000760928_194797568.pth new file mode 100644 index 0000000000000000000000000000000000000000..1fe49cea736f872691f6f732ca221963dc0a2c06 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000760928_194797568.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ca91e929b713b8a36d5d60c83a89d7ebb64cb3e505a5e27dd1d4809bed231d7 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000775200_198451200.pth b/checkpoint_p0/milestones/checkpoint_000775200_198451200.pth new file mode 100644 index 0000000000000000000000000000000000000000..1390436b114e3f5ac218c1399db512dec4b1a04b --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000775200_198451200.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5244950043861057a0e0dd19aa4decdcd5d6da22cb7283064957a3f44db16696 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000789504_202113024.pth b/checkpoint_p0/milestones/checkpoint_000789504_202113024.pth new file mode 100644 index 0000000000000000000000000000000000000000..f7465ec80ae4ddb092bfacb4bec4e8cae46de82d --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000789504_202113024.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b178ff2dc0d2537b30a935127af64ce18b8b4bb9cd71cd3bb5274336af0b9993 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000803808_205774848.pth b/checkpoint_p0/milestones/checkpoint_000803808_205774848.pth new file mode 100644 index 0000000000000000000000000000000000000000..73f60f122772de436fe3fdf3de756934d7e42ed5 --- 
/dev/null +++ b/checkpoint_p0/milestones/checkpoint_000803808_205774848.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ea347a09c224769304c21cf683ad46c3b1f7e5c7a330be2355e2b07fded642 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000818144_209444864.pth b/checkpoint_p0/milestones/checkpoint_000818144_209444864.pth new file mode 100644 index 0000000000000000000000000000000000000000..9428ac2b7124854f67e1b6517c152698ee3b9354 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000818144_209444864.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:646e5bcc91e4d07c45fe99cbb40c54a7cf809c229e8091dc92e7edd566b3ebb6 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000832512_213123072.pth b/checkpoint_p0/milestones/checkpoint_000832512_213123072.pth new file mode 100644 index 0000000000000000000000000000000000000000..d14d24b0c71c3307d4eec92cbc87934751871560 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000832512_213123072.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cccbcc410fa33cc4efef8d7cb4830a1b47c4909faafd0f18a9567926bb756512 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000846784_216776704.pth b/checkpoint_p0/milestones/checkpoint_000846784_216776704.pth new file mode 100644 index 0000000000000000000000000000000000000000..74459fe22887b3ca02dd59383afe24ec11b4a8e7 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000846784_216776704.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba102cd3421050ab858f3e06d604eb9f3a194d8f3c54e0dc2451eb834ee7a6a3 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000861088_220438528.pth b/checkpoint_p0/milestones/checkpoint_000861088_220438528.pth new file mode 100644 index 0000000000000000000000000000000000000000..3b3a6a08a16d043d66b8815aacc99715e4aab8d6 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000861088_220438528.pth @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:17328becbf5b6f17b7d7e067269527a61a590c7f9f2b9d8962e42dc205ed1ddc +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000875424_224108544.pth b/checkpoint_p0/milestones/checkpoint_000875424_224108544.pth new file mode 100644 index 0000000000000000000000000000000000000000..bad42535991b5a7a696f21d660f7aeb72085564d --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000875424_224108544.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167b1cfe8c1b31be5119a68f466c3a968b52b266f2a790f9b35a1200fe85a1b1 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000889792_227786752.pth b/checkpoint_p0/milestones/checkpoint_000889792_227786752.pth new file mode 100644 index 0000000000000000000000000000000000000000..91234bf44b4e7bc2375812bfa2e0e0934abe2720 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000889792_227786752.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d605fbfa366245037568a930816cced1ec30e340adb07684effc3cf5cfd4850 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000904128_231456768.pth b/checkpoint_p0/milestones/checkpoint_000904128_231456768.pth new file mode 100644 index 0000000000000000000000000000000000000000..886d8505a9c8e3fe25f8a1320f0af2faeb1cef80 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000904128_231456768.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:837ab4447bd4d7f5eb1e2b4b13e8d7f9dd6b7bf198ca667e59bea848beb2e5d4 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000918464_235126784.pth b/checkpoint_p0/milestones/checkpoint_000918464_235126784.pth new file mode 100644 index 0000000000000000000000000000000000000000..02c6c9b3e6f0afe34c64d30eb98662c96a93c7cc --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000918464_235126784.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:330f79ee90a64d29f19d398d621ddcd97aa4e9ac5706c53fd3489569c17c8246 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000932768_238788608.pth b/checkpoint_p0/milestones/checkpoint_000932768_238788608.pth new file mode 100644 index 0000000000000000000000000000000000000000..ba9dbd3910c7b12a6c800ea69c2ce76113482cd1 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000932768_238788608.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d92488fe4349e94f31fa4c40e17f39177d69081cd5c2ba4455aadb525fd9ce83 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000947104_242458624.pth b/checkpoint_p0/milestones/checkpoint_000947104_242458624.pth new file mode 100644 index 0000000000000000000000000000000000000000..077379579991812d18ec5f3caa67a387a5cdfb38 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000947104_242458624.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29109d01a23a6a85b7aec36284d74f39bec2d851db8a5e8dd059330a0280b100 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000961344_246104064.pth b/checkpoint_p0/milestones/checkpoint_000961344_246104064.pth new file mode 100644 index 0000000000000000000000000000000000000000..1d1e482bd4395c4fefc4c2fe25b870411de4748f --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000961344_246104064.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5187bd1cef41349a7a1222b5770af27f6f167a079a5a230e8c37000f69c80263 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_000975616_249757696.pth b/checkpoint_p0/milestones/checkpoint_000975616_249757696.pth new file mode 100644 index 0000000000000000000000000000000000000000..0cc6aa94b54c31dc13e132082b66f8283639d08e --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000975616_249757696.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b284be8e32f59ecb8c96f456beabc753ff9d685f93790f181a9d92e6d834d5d7 +size 20772619 diff 
--git a/checkpoint_p0/milestones/checkpoint_000989952_253427712.pth b/checkpoint_p0/milestones/checkpoint_000989952_253427712.pth new file mode 100644 index 0000000000000000000000000000000000000000..f3c244718757f3f2fb3849eafc9d3fd103438f54 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_000989952_253427712.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a858cc9fec690d12af840109fcb3738b082367f8e8217139b435a6142b82f5 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_001004224_257081344.pth b/checkpoint_p0/milestones/checkpoint_001004224_257081344.pth new file mode 100644 index 0000000000000000000000000000000000000000..e6b5f30a90852a3e055a59f303affec045c7b8cf --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_001004224_257081344.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecb02790ca8f16dc0e4b100ec3b420997189a7806cc5654636f5976f9cfa84e1 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_001018592_260759552.pth b/checkpoint_p0/milestones/checkpoint_001018592_260759552.pth new file mode 100644 index 0000000000000000000000000000000000000000..31d2fca94b96d7bd25689239fbff015304679c01 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_001018592_260759552.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3511299f993933fbe4a4c4995ac6db9368fa670c19494427106f06a72fd252f7 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_001032864_264413184.pth b/checkpoint_p0/milestones/checkpoint_001032864_264413184.pth new file mode 100644 index 0000000000000000000000000000000000000000..1f11645738c2104f230041bb98b32a242a1e0fa5 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_001032864_264413184.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62612955aea32c31c8ac19ee0172402fcce5a1cef7a83ef3763253c59c279d7a +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_001047104_268058624.pth 
b/checkpoint_p0/milestones/checkpoint_001047104_268058624.pth new file mode 100644 index 0000000000000000000000000000000000000000..610d1e1634b33338df3673de7c3b634fac900fab --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_001047104_268058624.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c675faeb0b5b1e19a3a7897b63445bf109fc7dabc3ebb6f063dddc4b0bd61f +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_001061408_271720448.pth b/checkpoint_p0/milestones/checkpoint_001061408_271720448.pth new file mode 100644 index 0000000000000000000000000000000000000000..2caaf5a3f8db9e641bc5d163542d65569d2e75e5 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_001061408_271720448.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d37c1c8c2fa97b54ad0565b582a6878e11c58e053a2be25591d327e7fd9bbd +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_001075680_275374080.pth b/checkpoint_p0/milestones/checkpoint_001075680_275374080.pth new file mode 100644 index 0000000000000000000000000000000000000000..125b3eb1de7a7d8887aac22827ec2c0c413a720c --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_001075680_275374080.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94751615b3be69d1103b9c864026560d263c8dad0a4548d81dba2f40e78badb +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_001089920_279019520.pth b/checkpoint_p0/milestones/checkpoint_001089920_279019520.pth new file mode 100644 index 0000000000000000000000000000000000000000..09de0ad577e35592ba5dba8825a464d93deb9800 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_001089920_279019520.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf0fc9ba2a321c8640905622c6a18ad1d3518a141d45b4faefa670f6410bfcb +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_001104192_282673152.pth b/checkpoint_p0/milestones/checkpoint_001104192_282673152.pth new file mode 100644 index 
0000000000000000000000000000000000000000..0237103aebb6772f25e669833fc843b9d4346a83 --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_001104192_282673152.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0790ed14a6f01e0eee9f63a378b1cfca6210c1834dafa8904d46aa26d7bcc9a8 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_001118496_286334976.pth b/checkpoint_p0/milestones/checkpoint_001118496_286334976.pth new file mode 100644 index 0000000000000000000000000000000000000000..6b834246b0ac390acc169ebdc442cbe81a0a739b --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_001118496_286334976.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b80ffa51c0cef9b8f4a0dd0794630f7c4428ec9a911dc6d2b83ebc5d8946b76 +size 20772619 diff --git a/checkpoint_p0/milestones/checkpoint_001132768_289988608.pth b/checkpoint_p0/milestones/checkpoint_001132768_289988608.pth new file mode 100644 index 0000000000000000000000000000000000000000..f271d4f62956be819df6a19da126d8cfed1bdefb --- /dev/null +++ b/checkpoint_p0/milestones/checkpoint_001132768_289988608.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab0d13941f458933f5846cb16e60a73f30f93b5998d74f9071bc21a90ab72ab8 +size 20772619 diff --git a/checkpoint_p1/best_001139808_291790848_reward_1220.070.pth b/checkpoint_p1/best_001139808_291790848_reward_1220.070.pth new file mode 100644 index 0000000000000000000000000000000000000000..552e5ffe278383b264553c7e0102619fbad3192a --- /dev/null +++ b/checkpoint_p1/best_001139808_291790848_reward_1220.070.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09772cfc91c1a568b52798761b6b99ff6f48fac240f8e000992657bf4c9747da +size 20771187 diff --git a/checkpoint_p1/checkpoint_001139648_291749888.pth b/checkpoint_p1/checkpoint_001139648_291749888.pth new file mode 100644 index 0000000000000000000000000000000000000000..a275fa851713abab686baa62d4e4f9ab6bb21fb6 --- /dev/null +++ 
b/checkpoint_p1/checkpoint_001139648_291749888.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e52ee35ea188cbabb3657c1aecfe09e20c76bf1cafc0b5b341cf257cca76e744 +size 20771651 diff --git a/checkpoint_p1/checkpoint_001140480_291962880.pth b/checkpoint_p1/checkpoint_001140480_291962880.pth new file mode 100644 index 0000000000000000000000000000000000000000..200ed9634ac3b0b946ded9d56b49d190142d4112 --- /dev/null +++ b/checkpoint_p1/checkpoint_001140480_291962880.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5d56309012510ee7fceea8c35eb66e79469e66394dc97d9341414e6bcaafa4 +size 20771651 diff --git a/checkpoint_p1/milestones/checkpoint_000017472_4472832.pth b/checkpoint_p1/milestones/checkpoint_000017472_4472832.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc4ca0ce8fb4cf2eb955519ff76ec27739e43e54 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000017472_4472832.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f971e5f89550865d6a0335e1856596f30cd3804cb40eefb0d1919e79883d38 +size 20772507 diff --git a/checkpoint_p1/milestones/checkpoint_000031552_8077312.pth b/checkpoint_p1/milestones/checkpoint_000031552_8077312.pth new file mode 100644 index 0000000000000000000000000000000000000000..11e5a357781757932b5b45fb748cde5f4ab2893e --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000031552_8077312.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d24d60547bde73cfc48e3ed160071867ee0d9d6aeb07a1904e8205f167d1c7 +size 20772507 diff --git a/checkpoint_p1/milestones/checkpoint_000045536_11657216.pth b/checkpoint_p1/milestones/checkpoint_000045536_11657216.pth new file mode 100644 index 0000000000000000000000000000000000000000..af1e7b320a6ea76c167721cf98db38d03c2aaa93 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000045536_11657216.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:00c083ef833a709a54505b6298690b8e56d0dcb7cdd53dc5574993d28ae65326 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000059680_15278080.pth b/checkpoint_p1/milestones/checkpoint_000059680_15278080.pth new file mode 100644 index 0000000000000000000000000000000000000000..485a944623096a29935eb73f16748b5d5fde13b7 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000059680_15278080.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d2f132850a85e303982cccfc09a476ced5cc346c03d7e820bea1db8d0e5d856 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000073824_18898944.pth b/checkpoint_p1/milestones/checkpoint_000073824_18898944.pth new file mode 100644 index 0000000000000000000000000000000000000000..40840d96a914aabe4dc6d1abefc1a6236435b4d6 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000073824_18898944.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c0c6c839ba712d125abab366c1457c5ea3bdb7722304d0bdfc626ea0dfc9e76 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000088032_22536192.pth b/checkpoint_p1/milestones/checkpoint_000088032_22536192.pth new file mode 100644 index 0000000000000000000000000000000000000000..104ba725710eb8886712d96d57baa8bc1218bf3b --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000088032_22536192.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a96ff27bee307d67bce4d03b62839bdb662e1504ee71269d5ea6b32e3aa60a +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000102176_26157056.pth b/checkpoint_p1/milestones/checkpoint_000102176_26157056.pth new file mode 100644 index 0000000000000000000000000000000000000000..3c6ee8988bd1c6267f3889d1c2e889d80fedcd2c --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000102176_26157056.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d309a4603f4bb2afdc7409ffd3cae6d8ee6013f240ee1ca53a13f6d36d420562 +size 20772563 diff --git 
a/checkpoint_p1/milestones/checkpoint_000116256_29761536.pth b/checkpoint_p1/milestones/checkpoint_000116256_29761536.pth new file mode 100644 index 0000000000000000000000000000000000000000..f85057a45a76bc419f2e4d1fdf49ec279ad6e356 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000116256_29761536.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87fa70b0d360e578842823971317c465b8cc3d58f671db8a5441062a7630226e +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000130464_33398784.pth b/checkpoint_p1/milestones/checkpoint_000130464_33398784.pth new file mode 100644 index 0000000000000000000000000000000000000000..e3e9c8e5c9c7a80fb018cbeb2c6a6a6f120e1bd7 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000130464_33398784.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63f1582dc8ae878d2e9618e62e4fe55e918633a39592574c0b79cb376ca47345 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000144640_37027840.pth b/checkpoint_p1/milestones/checkpoint_000144640_37027840.pth new file mode 100644 index 0000000000000000000000000000000000000000..10289da2fbe06e214973231dbad4f742d444e013 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000144640_37027840.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b8f8a189964c0699b117e41e34dc826b427a7dfeb2ba1d6a60a3b139bd05516 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000158752_40640512.pth b/checkpoint_p1/milestones/checkpoint_000158752_40640512.pth new file mode 100644 index 0000000000000000000000000000000000000000..ae83b78cc7f0c62375e0ede244675b297c810bda --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000158752_40640512.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff833f157f65ed6f6606eeccaa9df174a5129ccd003cf177330c4dd08c4c30ca +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000172864_44253184.pth 
b/checkpoint_p1/milestones/checkpoint_000172864_44253184.pth new file mode 100644 index 0000000000000000000000000000000000000000..e446d8bcb8e11a641b61576744a2a7bee459d2e3 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000172864_44253184.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94decafa9230e77a51f0c623c3ac54889ac705acaadb26e4534622dd7d5762c4 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000186976_47865856.pth b/checkpoint_p1/milestones/checkpoint_000186976_47865856.pth new file mode 100644 index 0000000000000000000000000000000000000000..0e97c60446d8652c11da4e820a3039e34b1928ef --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000186976_47865856.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eee072b5f1867c7ba7929688c8df02206ac7441c4c0bd1b08e9aadbbe5d9186 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000201120_51486720.pth b/checkpoint_p1/milestones/checkpoint_000201120_51486720.pth new file mode 100644 index 0000000000000000000000000000000000000000..b2dc6688e2ab78cd2bff10f36e5c398a4481279e --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000201120_51486720.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf0037228e0b741d01efa6fc67eca53afefae817b278ab5825e9f9318f4ba45a +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000215264_55107584.pth b/checkpoint_p1/milestones/checkpoint_000215264_55107584.pth new file mode 100644 index 0000000000000000000000000000000000000000..3af1660d556bff8fb6bead64afa2ba8742322009 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000215264_55107584.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25745d6e421c1efa59d1030531cefb560fb0d47176dca8571f0967af94ef8f4 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000229344_58712064.pth b/checkpoint_p1/milestones/checkpoint_000229344_58712064.pth new file mode 100644 index 
0000000000000000000000000000000000000000..debee7d67fac33cd3557d54ac4fa8b37ab76ef3f --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000229344_58712064.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d16419c6693ead3e5642c20d2f3a491497ce379a46de244b667205217e62f880 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000243520_62341120.pth b/checkpoint_p1/milestones/checkpoint_000243520_62341120.pth new file mode 100644 index 0000000000000000000000000000000000000000..9eadc1c597a638b6603fb7123ab3aa4ed0c8a57a --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000243520_62341120.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b200bbc52994662568b8d30b89fb98d0738099a28a21632029e9b1ce99c47a5 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000257664_65961984.pth b/checkpoint_p1/milestones/checkpoint_000257664_65961984.pth new file mode 100644 index 0000000000000000000000000000000000000000..14620bce60662687fa4064af7ba29391685cdadd --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000257664_65961984.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab4c64acec1534379c270e5379786395d73680951e3f250e9e18d31af2dbd3de +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000271904_69607424.pth b/checkpoint_p1/milestones/checkpoint_000271904_69607424.pth new file mode 100644 index 0000000000000000000000000000000000000000..db7363585cf2a48d5114a102ef35fa898cb736e0 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000271904_69607424.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95debf7ef9e6c856479e77600b276336eb8f32d9ab21bb9be8205e740fb92f43 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000286080_73236480.pth b/checkpoint_p1/milestones/checkpoint_000286080_73236480.pth new file mode 100644 index 0000000000000000000000000000000000000000..12c48b75b277883add5af313fa2eba86cae460d8 --- /dev/null +++ 
b/checkpoint_p1/milestones/checkpoint_000286080_73236480.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:178f5799c3a6fb6004a8f5e9e117e249cdf00547db5f6f1d166bbe2a22b282d5 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000300320_76881920.pth b/checkpoint_p1/milestones/checkpoint_000300320_76881920.pth new file mode 100644 index 0000000000000000000000000000000000000000..5e8ed4c234c828da10e0034c10d299e8c4509e39 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000300320_76881920.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794022db9988b6d2694cf88ffe543c55b3ce288847db9ac4ad426b709f7c405a +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000314592_80535552.pth b/checkpoint_p1/milestones/checkpoint_000314592_80535552.pth new file mode 100644 index 0000000000000000000000000000000000000000..a5af33f1af85960becda30412d4f5a14e6ff676a --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000314592_80535552.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7af045e9e51162c8dbea14a0bba48611f8f2b16bf6864406477e97a998229e74 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000328928_84205568.pth b/checkpoint_p1/milestones/checkpoint_000328928_84205568.pth new file mode 100644 index 0000000000000000000000000000000000000000..0db083f5c27e42bddce3483d73a6d6324bbed30b --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000328928_84205568.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9dd1ed6e71d0b667c4e7acda4567c8edb60a39e28995d8e53f1a8c67c2490f +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000343136_87842816.pth b/checkpoint_p1/milestones/checkpoint_000343136_87842816.pth new file mode 100644 index 0000000000000000000000000000000000000000..a7e06219b5db434e8f985a81ecf184244d0abc19 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000343136_87842816.pth @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:2bea24ba4672651c9306ceb317499f5cf38afa7ded1ba4d1fda9da45266e1a1f +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000357312_91471872.pth b/checkpoint_p1/milestones/checkpoint_000357312_91471872.pth new file mode 100644 index 0000000000000000000000000000000000000000..2040661fe39860e6cddc12f98c27db0024c4d1b3 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000357312_91471872.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38a7c4a10c1da18615542d620f754733650fba7ba5a79338e5a03349e950dbf3 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000371584_95125504.pth b/checkpoint_p1/milestones/checkpoint_000371584_95125504.pth new file mode 100644 index 0000000000000000000000000000000000000000..723651faa1d4c5a518b2eeb9502c11cd675b7ed3 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000371584_95125504.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61e9812f3fb5a6a50572338f78d0953e0fe54263711efb20e2327da4cd9c73f +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000385888_98787328.pth b/checkpoint_p1/milestones/checkpoint_000385888_98787328.pth new file mode 100644 index 0000000000000000000000000000000000000000..1b9a55f3e6d210d70360e0746047ef6a22ebf687 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000385888_98787328.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f01ab64684469fc92db7e5ef16f5aae893c760ac9dd81c63651876518ccd251 +size 20772563 diff --git a/checkpoint_p1/milestones/checkpoint_000400160_102440960.pth b/checkpoint_p1/milestones/checkpoint_000400160_102440960.pth new file mode 100644 index 0000000000000000000000000000000000000000..f16c1e7ec93529b0f38afdd379ca5cb42cb8118e --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000400160_102440960.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:a6ce6dbad1162219cd3970315fd7b0a4b05c582cb8f3c741a3d95bfb8925764c +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000414336_106070016.pth b/checkpoint_p1/milestones/checkpoint_000414336_106070016.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a0d335d1eccc126ed329127063a7ec263d2b0ee --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000414336_106070016.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a70042e89e8b935372aa061505de91da178659284acb7aeafa766f77423e6274 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000428608_109723648.pth b/checkpoint_p1/milestones/checkpoint_000428608_109723648.pth new file mode 100644 index 0000000000000000000000000000000000000000..90b3d4b2d12b4e5e080a30448a950884b67c1673 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000428608_109723648.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d313a834cbff1db458c687ce7f7012fc7dc41707bb6b9f4f92077060ff191059 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000442816_113360896.pth b/checkpoint_p1/milestones/checkpoint_000442816_113360896.pth new file mode 100644 index 0000000000000000000000000000000000000000..f50d363fddb47034a37636914a6d37ac449b1a9f --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000442816_113360896.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2757af2c31c8bf0f147b25edc5f6357913d61fe1ade2671f81c60fc7477778b4 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000457024_116998144.pth b/checkpoint_p1/milestones/checkpoint_000457024_116998144.pth new file mode 100644 index 0000000000000000000000000000000000000000..732da37db0a79ef87a50217eea35e528ad4c75b2 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000457024_116998144.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afa88a8f27276e52749c043bfdfc905a874b82da1220787deb45720895b7d762 +size 20772619 diff 
--git a/checkpoint_p1/milestones/checkpoint_000471328_120659968.pth b/checkpoint_p1/milestones/checkpoint_000471328_120659968.pth new file mode 100644 index 0000000000000000000000000000000000000000..12b323494e4df95e2cc3869b4c56e961d5443757 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000471328_120659968.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b052b33478156a55210f1e2d026b44a83849f290173a82fbe4ad17292d99d6 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000485632_124321792.pth b/checkpoint_p1/milestones/checkpoint_000485632_124321792.pth new file mode 100644 index 0000000000000000000000000000000000000000..61c8384a37094783a868654322a09c9baa140ba1 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000485632_124321792.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f0c004d5cace789a2105d6f48b50780d2472ba2cf1da03745041fcb95afc889 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000499840_127959040.pth b/checkpoint_p1/milestones/checkpoint_000499840_127959040.pth new file mode 100644 index 0000000000000000000000000000000000000000..82cae68bcf35dbb96f29e75659bef703d6991c51 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000499840_127959040.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf28f8e054619a9308ca92448b6d43eae35a726e5745738e4395625e91701441 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000514112_131612672.pth b/checkpoint_p1/milestones/checkpoint_000514112_131612672.pth new file mode 100644 index 0000000000000000000000000000000000000000..c7eaf9b4b0930aa27927f51cb21aeff6b515d256 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000514112_131612672.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3813e9895ee8eab23d0279c582b50f8381c44cfff42bebb9fb7e3ad4dfb3cdaf +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000528384_135266304.pth 
b/checkpoint_p1/milestones/checkpoint_000528384_135266304.pth new file mode 100644 index 0000000000000000000000000000000000000000..385a95adb857ef541faa09cb44a579612ed976bd --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000528384_135266304.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7348f89eaf83c05c3bed5e98a25a2b98e01699e01c448bc5710d1d68714e2bab +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000542656_138919936.pth b/checkpoint_p1/milestones/checkpoint_000542656_138919936.pth new file mode 100644 index 0000000000000000000000000000000000000000..e6004cb4c81c90c538b6d6f7e3dce3b973335161 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000542656_138919936.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b6c268290d71db64574d1c5057a0cd8e5c83aab500905819a4ac8308678120e +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000556800_142540800.pth b/checkpoint_p1/milestones/checkpoint_000556800_142540800.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c24c8f56e0da79b7c29f28804b02ec2f59e6662 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000556800_142540800.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f7def208f80a2d03cc3ec0d80f71ff572469b1aa6c6ef644785481125ac2d4e +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000571072_146194432.pth b/checkpoint_p1/milestones/checkpoint_000571072_146194432.pth new file mode 100644 index 0000000000000000000000000000000000000000..5d481bab18e9afd3bbc6081a988fafff9f7d961d --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000571072_146194432.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00709103bae54e2cfc8c15465d313bca0d40854a89bd73948140988712159947 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000585312_149839872.pth b/checkpoint_p1/milestones/checkpoint_000585312_149839872.pth new file mode 100644 index 
0000000000000000000000000000000000000000..45a23125d283fc7dce90acf23ca3c6e02c530332 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000585312_149839872.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:810d19d090f67b0333ccf8013d6306646584b0fde8f0e05fd8573222f4cd0c44 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000599584_153493504.pth b/checkpoint_p1/milestones/checkpoint_000599584_153493504.pth new file mode 100644 index 0000000000000000000000000000000000000000..ace782c675bf82fe8932664d199868da22be92db --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000599584_153493504.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d0764d1887e88cc1b0e9710ee779fa61a93665c8600d235d982fc1a81fe54d4 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000613856_157147136.pth b/checkpoint_p1/milestones/checkpoint_000613856_157147136.pth new file mode 100644 index 0000000000000000000000000000000000000000..bdebdc3cd96f1ea615dd6246fc3c62cf4f6123ff --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000613856_157147136.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d752eda507b0f76595d847398c4d53c042ba41b02c97a72acf03f5954f9da402 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000628192_160817152.pth b/checkpoint_p1/milestones/checkpoint_000628192_160817152.pth new file mode 100644 index 0000000000000000000000000000000000000000..b9e054d4f648146160c602abef60b0cd177e27c2 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000628192_160817152.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e66966c35567ae80340bf762e07c168ef5999b260b4cf3506453cf51ee66a11 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000642496_164478976.pth b/checkpoint_p1/milestones/checkpoint_000642496_164478976.pth new file mode 100644 index 0000000000000000000000000000000000000000..0018af2089b02260f30e77d9391ced77fbd92888 --- 
/dev/null +++ b/checkpoint_p1/milestones/checkpoint_000642496_164478976.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4623bd7817378d48617260c0e5dac95bae6fb561008e80de5fbe18f31fd7aee +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000656800_168140800.pth b/checkpoint_p1/milestones/checkpoint_000656800_168140800.pth new file mode 100644 index 0000000000000000000000000000000000000000..55de52de8199719b1f5bcef34a4ef73b1c9406cc --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000656800_168140800.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e514ae55d218975b4b67d1d2b7600986c911c06a43752f79cf63bdeb54e0dbe +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000671168_171819008.pth b/checkpoint_p1/milestones/checkpoint_000671168_171819008.pth new file mode 100644 index 0000000000000000000000000000000000000000..8ed4a5edce5a34d3b53d9158c1397789f0720734 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000671168_171819008.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53a87c27f6f3462999ae1376c2aa75caa26843e2d62537466456b52cac4e2639 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000685440_175472640.pth b/checkpoint_p1/milestones/checkpoint_000685440_175472640.pth new file mode 100644 index 0000000000000000000000000000000000000000..a602c7312b009c609c7c5ef11fcef302593e1a4a --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000685440_175472640.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6583165026fb92cc0079b2ed0d28459c2f0469f300de3d58675cdc70bab2e7df +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000699680_179118080.pth b/checkpoint_p1/milestones/checkpoint_000699680_179118080.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f41f4305cfc8025eee69e271433903e9970a198 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000699680_179118080.pth @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:f6412c300f6f2c515632bf4d70ab47a97b3570c673138422535fa3e06edba3c4 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000713952_182771712.pth b/checkpoint_p1/milestones/checkpoint_000713952_182771712.pth new file mode 100644 index 0000000000000000000000000000000000000000..70ecf35c93a814c46440132526f02076455d3bd0 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000713952_182771712.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05de2a446a5d65a090b210107b505d72c998847a057d7aefc4b27750aef9619 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000728192_186417152.pth b/checkpoint_p1/milestones/checkpoint_000728192_186417152.pth new file mode 100644 index 0000000000000000000000000000000000000000..75c033d9dc166647ed6ad2c851529a62cf8f3879 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000728192_186417152.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb215cf82aaac84ecb5d601fec18fd7008bf57b741b879ddb8f1a36aded7350a +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000742400_190054400.pth b/checkpoint_p1/milestones/checkpoint_000742400_190054400.pth new file mode 100644 index 0000000000000000000000000000000000000000..a1864919dd2cb3e80df6a064ed97d65434bd0296 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000742400_190054400.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c35d0dbab93987ebce6d9960d5db5aa4431993b511176870fd677b3d3dd13c66 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000756608_193691648.pth b/checkpoint_p1/milestones/checkpoint_000756608_193691648.pth new file mode 100644 index 0000000000000000000000000000000000000000..24e725af7de06323e6e1092badeceeb911122113 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000756608_193691648.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:7ba188833e9adec93734b72842f29591d1baf3d2be20e9fcae2a29213efc6633 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000770848_197337088.pth b/checkpoint_p1/milestones/checkpoint_000770848_197337088.pth new file mode 100644 index 0000000000000000000000000000000000000000..27f571c7714582024700b292cb90f9c27fa3d6a6 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000770848_197337088.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ef99ad32ec53746b5159295452bbf074a267e8614a2684d592ce716ef504783 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000785024_200966144.pth b/checkpoint_p1/milestones/checkpoint_000785024_200966144.pth new file mode 100644 index 0000000000000000000000000000000000000000..0cafd3deac3ca71e2c9d032e780f5ed741df4a1b --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000785024_200966144.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fe1eea5188b3c5a28a05d5cf243fa5be7d58d03e4cc772f9a721b2ec68fd8f4 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000799296_204619776.pth b/checkpoint_p1/milestones/checkpoint_000799296_204619776.pth new file mode 100644 index 0000000000000000000000000000000000000000..c0a489f707cd6adcc731a70ebe7bc3d06b1b5b85 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000799296_204619776.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b487f88dbfaadc0b68f1b6b385cd5c37d2a991cd30f235b701cfa004f48e35b8 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000813536_208265216.pth b/checkpoint_p1/milestones/checkpoint_000813536_208265216.pth new file mode 100644 index 0000000000000000000000000000000000000000..319cd4dd15f4ae596d03943e0402c4a442bc2d70 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000813536_208265216.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ecc7de6f645618c4b862ea8d23f8252b3e4c432e0fc4adc4ca9627072c2bcc0 +size 20772619 diff 
--git a/checkpoint_p1/milestones/checkpoint_000827808_211918848.pth b/checkpoint_p1/milestones/checkpoint_000827808_211918848.pth new file mode 100644 index 0000000000000000000000000000000000000000..3e6ac474fa5028b54bcfd93785da5e01b2eed29f --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000827808_211918848.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:700457d00af7346c54b6acad6f53e084fb14d81ea1c4ebbfe745befb86c42b3e +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000841984_215547904.pth b/checkpoint_p1/milestones/checkpoint_000841984_215547904.pth new file mode 100644 index 0000000000000000000000000000000000000000..a0fd562f4e484b6938959f485afc2c7e5d6d8530 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000841984_215547904.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3954271419800364ff87c3322434bc7b144167872e8a6ff6b54be290433d47f +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000856192_219185152.pth b/checkpoint_p1/milestones/checkpoint_000856192_219185152.pth new file mode 100644 index 0000000000000000000000000000000000000000..d5bcf0447aa14da773485ce247a9964c1cfef7d8 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000856192_219185152.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e2bee360d368251aa19b29aa1fac45bcb4a43367d5b3beb92e4c3293376e57a +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000870432_222830592.pth b/checkpoint_p1/milestones/checkpoint_000870432_222830592.pth new file mode 100644 index 0000000000000000000000000000000000000000..ac18d366cbec708a1f1d49c35e69084baa5b1317 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000870432_222830592.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f84575c620a758d53067652fc165c12f6b522d2da9ff5c830a86b51c0a5e845c +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000884736_226492416.pth 
b/checkpoint_p1/milestones/checkpoint_000884736_226492416.pth new file mode 100644 index 0000000000000000000000000000000000000000..5fe34869baa7cfc0ebdf18ec76ae5d6bd042e3e1 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000884736_226492416.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d4b521777facf66c84a06b63858603da4e1a4ddbdc1cb23ab1f561b516058c +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000899008_230146048.pth b/checkpoint_p1/milestones/checkpoint_000899008_230146048.pth new file mode 100644 index 0000000000000000000000000000000000000000..d88af58647af80694c1a1db831276ec8e823d621 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000899008_230146048.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:673f678f82c2d69f1b1739087ddbc9ed89318e2585a2d9e10c700c234ad6481b +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000913248_233791488.pth b/checkpoint_p1/milestones/checkpoint_000913248_233791488.pth new file mode 100644 index 0000000000000000000000000000000000000000..a8b877e591d5f1e29728971c9162ab17c85c0f09 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000913248_233791488.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c533bb00e8be4baf2c81527b12df07a63e3a7ee01fd4f1fe431f140bfaadae09 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000927552_237453312.pth b/checkpoint_p1/milestones/checkpoint_000927552_237453312.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef327cd75e76c3f16b3bec14e6ee412e59a0ed42 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000927552_237453312.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b97b0ed9fec1a004e052737005a7d4469260a0d662102bb0e4b76a1540a9e7 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000941856_241115136.pth b/checkpoint_p1/milestones/checkpoint_000941856_241115136.pth new file mode 100644 index 
0000000000000000000000000000000000000000..5469b4ef3772b11a364cf42e8e9ee82e7d5176ca --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000941856_241115136.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae317adc22b86e7d5594c17fcb93a7d64866d1e0764ca7a0582dc27b8a915deb +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000956128_244768768.pth b/checkpoint_p1/milestones/checkpoint_000956128_244768768.pth new file mode 100644 index 0000000000000000000000000000000000000000..b9c90f05d4fe9d8f1749dfa247b49d4eefa0a192 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000956128_244768768.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c94efb508213aa22a19ce32928a8148e4edbe82c5379651faac0641461608e9 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000970272_248389632.pth b/checkpoint_p1/milestones/checkpoint_000970272_248389632.pth new file mode 100644 index 0000000000000000000000000000000000000000..fc862eeeda00b84fc97d7c5ae9a6887dd84aac80 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000970272_248389632.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9285b4ce8bc8f9c9310e9fdc3c681e44dec0cfe4636abf3bfbb055ecfe9a7f93 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000984544_252043264.pth b/checkpoint_p1/milestones/checkpoint_000984544_252043264.pth new file mode 100644 index 0000000000000000000000000000000000000000..c8521b4f290d83a80d689340adad8838da7d230b --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_000984544_252043264.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72d0e259bd5ac5799a3eec0347b3065a3e6cc594d99ad8b2cab7fa5c3e25ec2d +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_000998848_255705088.pth b/checkpoint_p1/milestones/checkpoint_000998848_255705088.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f838df1c822543d4c6376b832d9f0b1c0482fbe --- 
/dev/null +++ b/checkpoint_p1/milestones/checkpoint_000998848_255705088.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c6f8fad108748010ef993326c824e8c85393513f34c89d82d7a1b92c2425621 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_001013024_259334144.pth b/checkpoint_p1/milestones/checkpoint_001013024_259334144.pth new file mode 100644 index 0000000000000000000000000000000000000000..f724fa7df7ab3018cdf8cf290d1f959588b620e9 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_001013024_259334144.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1d2f408bf6edde7b5a03cd954cb57c678596f223b69ef8feb26d714da471120 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_001027296_262987776.pth b/checkpoint_p1/milestones/checkpoint_001027296_262987776.pth new file mode 100644 index 0000000000000000000000000000000000000000..7df329902fd71d67746d3ef68b086f7068428f73 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_001027296_262987776.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:440490ded0e2a957da183415145dda4af9bed66ac37ddab406efdc7a6c2563db +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_001041504_266625024.pth b/checkpoint_p1/milestones/checkpoint_001041504_266625024.pth new file mode 100644 index 0000000000000000000000000000000000000000..688ef06454cb24afddfb7019c5ab3bc73c66716a --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_001041504_266625024.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c579d019a32da7de6b4d6c39d5ba60f2e7d743a32a1f32430eff8d745c5e466 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_001055808_270286848.pth b/checkpoint_p1/milestones/checkpoint_001055808_270286848.pth new file mode 100644 index 0000000000000000000000000000000000000000..2aa8f6dd488740eb2a860de81c77f284caf5a784 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_001055808_270286848.pth @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:50b7e36bb726f863305fc683e357f69ad181adf3ed68c7ef5eaafae6a787e1a4 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_001069984_273915904.pth b/checkpoint_p1/milestones/checkpoint_001069984_273915904.pth new file mode 100644 index 0000000000000000000000000000000000000000..65bd51c4ff642f6de832c4937342a99373d8bf64 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_001069984_273915904.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:005cc309bbd3d79664ace591b03ed833400901905b790abacc1a3ffde029fa02 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_001084192_277553152.pth b/checkpoint_p1/milestones/checkpoint_001084192_277553152.pth new file mode 100644 index 0000000000000000000000000000000000000000..f87709d8b926ec27b201aed44813527d328d1794 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_001084192_277553152.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ecc566063d43ce9f7197f4c399af2b4ec0c81e33af8d4fa96c16212b05feab7 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_001098368_281182208.pth b/checkpoint_p1/milestones/checkpoint_001098368_281182208.pth new file mode 100644 index 0000000000000000000000000000000000000000..2c70470ef00be04aa75f8b775a09b56b0b49d2cb --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_001098368_281182208.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8faa08b40c2609410907d79d743e610e9a31ba106419ec366f42bba53492cb10 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_001112608_284827648.pth b/checkpoint_p1/milestones/checkpoint_001112608_284827648.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f909d48cd50fbcef80a4bdcbd11ab225c93f817 --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_001112608_284827648.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:9a50a4a8ca762563669e754ddd48bc01256ca99f61bb35089b9750392d09a264 +size 20772619 diff --git a/checkpoint_p1/milestones/checkpoint_001126784_288456704.pth b/checkpoint_p1/milestones/checkpoint_001126784_288456704.pth new file mode 100644 index 0000000000000000000000000000000000000000..63aa7681e73483cb1ed1b66c31b845e01194bccd --- /dev/null +++ b/checkpoint_p1/milestones/checkpoint_001126784_288456704.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:579d73aa751dfa4667a7ded826ac4fbc2a90ddc337781a0a0796de77ab5f8862 +size 20772619 diff --git a/git.diff b/git.diff index 8251aa45c774e7a868eb7ba8d662d7bb4c2269ff..fc7ad13e3de9b6b82647c814181009f3731ce121 100644 --- a/git.diff +++ b/git.diff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2464da1601e095c629f46a5ef1ef7322a64234d560931c130d8a8e640a96e217 -size 14449550 +oid sha256:734a2cfe83db19ea719eb536340f696eb5ed83c05a84e7259ce69215c26bf901 +size 14551318 diff --git a/replay.mp4 b/replay.mp4 index cce574d64d238e555d377bcbc307e1472b768893..2480b85545583c17cb494dffb63a65f1189a94b3 100644 Binary files a/replay.mp4 and b/replay.mp4 differ diff --git a/sf_log.txt b/sf_log.txt index fd51ef5397dd536668fbb46b982c9d7d53c05ffc..ab3789034e1b15004e4f94f5afa29f20fe3b4de3 100644 --- a/sf_log.txt +++ b/sf_log.txt @@ -1,1478 +1,3 @@ -[2023-10-17 12:40:56,748][112888] Saving configuration to ./train_atari/atari_asteroid_APPO/config.json... 
-[2023-10-17 12:40:57,065][112888] Rollout worker 0 uses device cpu -[2023-10-17 12:40:57,066][112888] Rollout worker 1 uses device cpu -[2023-10-17 12:40:57,066][112888] Rollout worker 2 uses device cpu -[2023-10-17 12:40:57,067][112888] Rollout worker 3 uses device cpu -[2023-10-17 12:40:57,067][112888] Rollout worker 4 uses device cpu -[2023-10-17 12:40:57,068][112888] Rollout worker 5 uses device cpu -[2023-10-17 12:40:57,068][112888] Rollout worker 6 uses device cpu -[2023-10-17 12:40:57,069][112888] Rollout worker 7 uses device cpu -[2023-10-17 12:40:57,069][112888] Rollout worker 8 uses device cpu -[2023-10-17 12:40:57,069][112888] Rollout worker 9 uses device cpu -[2023-10-17 12:40:57,070][112888] Rollout worker 10 uses device cpu -[2023-10-17 12:40:57,070][112888] Rollout worker 11 uses device cpu -[2023-10-17 12:40:57,071][112888] Rollout worker 12 uses device cpu -[2023-10-17 12:40:57,071][112888] Rollout worker 13 uses device cpu -[2023-10-17 12:40:57,072][112888] Rollout worker 14 uses device cpu -[2023-10-17 12:40:57,072][112888] Rollout worker 15 uses device cpu -[2023-10-17 12:40:57,355][112888] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-10-17 12:40:57,355][112888] InferenceWorker_p0-w0: min num requests: 2 -[2023-10-17 12:40:57,358][112888] Using GPUs [1] for process 1 (actually maps to GPUs [1]) -[2023-10-17 12:40:57,359][112888] InferenceWorker_p1-w0: min num requests: 2 -[2023-10-17 12:40:57,404][112888] Starting all processes... 
-[2023-10-17 12:40:57,405][112888] Starting process learner_proc0 -[2023-10-17 12:40:59,103][112888] Starting process learner_proc1 -[2023-10-17 12:40:59,107][113622] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-10-17 12:40:59,107][113622] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 -[2023-10-17 12:40:59,125][113622] Num visible devices: 1 -[2023-10-17 12:40:59,151][113622] Setting fixed seed 1234 -[2023-10-17 12:40:59,152][113622] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-10-17 12:40:59,152][113622] Initializing actor-critic model on device cuda:0 -[2023-10-17 12:40:59,153][113622] RunningMeanStd input shape: (4, 84, 84) -[2023-10-17 12:40:59,153][113622] RunningMeanStd input shape: (1,) -[2023-10-17 12:40:59,164][113622] ConvEncoder: input_channels=4 -[2023-10-17 12:40:59,325][113622] Conv encoder output size: 512 -[2023-10-17 12:40:59,327][113622] Created Actor Critic model with architecture: -[2023-10-17 12:40:59,327][113622] ActorCriticSharedWeights( - (obs_normalizer): ObservationNormalizer( - (running_mean_std): RunningMeanStdDictInPlace( - (running_mean_std): ModuleDict( - (obs): RunningMeanStdInPlace() - ) - ) - ) - (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) - (encoder): MultiInputEncoder( - (encoders): ModuleDict( - (obs): ConvEncoder( - (enc): RecursiveScriptModule( - original_name=ConvEncoderImpl - (conv_head): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Conv2d) - (1): RecursiveScriptModule(original_name=ReLU) - (2): RecursiveScriptModule(original_name=Conv2d) - (3): RecursiveScriptModule(original_name=ReLU) - (4): RecursiveScriptModule(original_name=Conv2d) - (5): RecursiveScriptModule(original_name=ReLU) - ) - (mlp_layers): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Linear) - (1): RecursiveScriptModule(original_name=ReLU) - ) - ) - 
) - ) - ) - (core): ModelCoreIdentity() - (decoder): MlpDecoder( - (mlp): Identity() - ) - (critic_linear): Linear(in_features=512, out_features=1, bias=True) - (action_parameterization): ActionParameterizationDefault( - (distribution_linear): Linear(in_features=512, out_features=14, bias=True) - ) -) -[2023-10-17 12:40:59,912][113622] Using optimizer -[2023-10-17 12:40:59,913][113622] No checkpoints found -[2023-10-17 12:40:59,913][113622] Did not load from checkpoint, starting from scratch! -[2023-10-17 12:40:59,913][113622] Initialized policy 0 weights for model version 0 -[2023-10-17 12:40:59,914][113622] LearnerWorker_p0 finished initialization! -[2023-10-17 12:40:59,915][113622] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-10-17 12:41:00,851][112888] Starting all processes... -[2023-10-17 12:41:00,855][113701] Using GPUs [1] for process 1 (actually maps to GPUs [1]) -[2023-10-17 12:41:00,855][113701] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1 -[2023-10-17 12:41:00,859][112888] Starting process inference_proc0-0 -[2023-10-17 12:41:00,860][112888] Starting process inference_proc1-0 -[2023-10-17 12:41:00,860][112888] Starting process rollout_proc0 -[2023-10-17 12:41:00,873][113701] Num visible devices: 1 -[2023-10-17 12:41:00,860][112888] Starting process rollout_proc1 -[2023-10-17 12:41:00,861][112888] Starting process rollout_proc2 -[2023-10-17 12:41:00,861][112888] Starting process rollout_proc3 -[2023-10-17 12:41:00,892][113701] Setting fixed seed 1234 -[2023-10-17 12:41:00,864][112888] Starting process rollout_proc4 -[2023-10-17 12:41:00,893][113701] Using GPUs [0] for process 1 (actually maps to GPUs [1]) -[2023-10-17 12:41:00,893][113701] Initializing actor-critic model on device cuda:0 -[2023-10-17 12:41:00,894][113701] RunningMeanStd input shape: (4, 84, 84) -[2023-10-17 12:41:00,894][113701] RunningMeanStd input shape: (1,) -[2023-10-17 12:41:00,865][112888] Starting process rollout_proc5 
-[2023-10-17 12:41:00,870][112888] Starting process rollout_proc6 -[2023-10-17 12:41:00,875][112888] Starting process rollout_proc7 -[2023-10-17 12:41:00,875][112888] Starting process rollout_proc8 -[2023-10-17 12:41:00,877][112888] Starting process rollout_proc9 -[2023-10-17 12:41:00,906][113701] ConvEncoder: input_channels=4 -[2023-10-17 12:41:00,883][112888] Starting process rollout_proc10 -[2023-10-17 12:41:00,883][112888] Starting process rollout_proc11 -[2023-10-17 12:41:00,891][112888] Starting process rollout_proc12 -[2023-10-17 12:41:00,892][112888] Starting process rollout_proc13 -[2023-10-17 12:41:01,358][113701] Conv encoder output size: 512 -[2023-10-17 12:41:01,361][113701] Created Actor Critic model with architecture: -[2023-10-17 12:41:01,361][113701] ActorCriticSharedWeights( - (obs_normalizer): ObservationNormalizer( - (running_mean_std): RunningMeanStdDictInPlace( - (running_mean_std): ModuleDict( - (obs): RunningMeanStdInPlace() - ) - ) - ) - (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) - (encoder): MultiInputEncoder( - (encoders): ModuleDict( - (obs): ConvEncoder( - (enc): RecursiveScriptModule( - original_name=ConvEncoderImpl - (conv_head): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Conv2d) - (1): RecursiveScriptModule(original_name=ReLU) - (2): RecursiveScriptModule(original_name=Conv2d) - (3): RecursiveScriptModule(original_name=ReLU) - (4): RecursiveScriptModule(original_name=Conv2d) - (5): RecursiveScriptModule(original_name=ReLU) - ) - (mlp_layers): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Linear) - (1): RecursiveScriptModule(original_name=ReLU) - ) - ) - ) - ) - ) - (core): ModelCoreIdentity() - (decoder): MlpDecoder( - (mlp): Identity() - ) - (critic_linear): Linear(in_features=512, out_features=1, bias=True) - (action_parameterization): ActionParameterizationDefault( - (distribution_linear): 
Linear(in_features=512, out_features=14, bias=True) - ) -) -[2023-10-17 12:41:02,052][113701] Using optimizer -[2023-10-17 12:41:02,053][113701] No checkpoints found -[2023-10-17 12:41:02,053][113701] Did not load from checkpoint, starting from scratch! -[2023-10-17 12:41:02,053][113701] Initialized policy 1 weights for model version 0 -[2023-10-17 12:41:02,054][113701] LearnerWorker_p1 finished initialization! -[2023-10-17 12:41:02,055][113701] Using GPUs [0] for process 1 (actually maps to GPUs [1]) -[2023-10-17 12:41:03,037][112888] Starting process rollout_proc14 -[2023-10-17 12:41:03,042][113888] Using GPUs [1] for process 1 (actually maps to GPUs [1]) -[2023-10-17 12:41:03,042][113888] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1 -[2023-10-17 12:41:03,061][113888] Num visible devices: 1 -[2023-10-17 12:41:03,079][112888] Starting process rollout_proc15 -[2023-10-17 12:41:03,090][113926] Worker 6 uses CPU cores [12, 13] -[2023-10-17 12:41:03,098][113932] Worker 10 uses CPU cores [20, 21] -[2023-10-17 12:41:03,102][113924] Worker 3 uses CPU cores [6, 7] -[2023-10-17 12:41:03,117][113927] Worker 8 uses CPU cores [16, 17] -[2023-10-17 12:41:03,194][113930] Worker 7 uses CPU cores [14, 15] -[2023-10-17 12:41:03,282][113925] Worker 5 uses CPU cores [10, 11] -[2023-10-17 12:41:03,335][113929] Worker 4 uses CPU cores [8, 9] -[2023-10-17 12:41:03,338][113934] Worker 12 uses CPU cores [24, 25] -[2023-10-17 12:41:03,447][113920] Worker 0 uses CPU cores [0, 1] -[2023-10-17 12:41:03,490][113922] Worker 2 uses CPU cores [4, 5] -[2023-10-17 12:41:03,664][113933] Worker 13 uses CPU cores [26, 27] -[2023-10-17 12:41:03,672][113887] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-10-17 12:41:03,672][113887] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 -[2023-10-17 12:41:03,678][113923] Worker 1 uses CPU cores [2, 3] -[2023-10-17 12:41:03,690][113887] Num visible devices: 1 
-[2023-10-17 12:41:03,789][113888] RunningMeanStd input shape: (4, 84, 84) -[2023-10-17 12:41:03,789][113888] RunningMeanStd input shape: (1,) -[2023-10-17 12:41:03,801][113888] ConvEncoder: input_channels=4 -[2023-10-17 12:41:03,881][113931] Worker 11 uses CPU cores [22, 23] -[2023-10-17 12:41:03,908][113888] Conv encoder output size: 512 -[2023-10-17 12:41:03,942][113928] Worker 9 uses CPU cores [18, 19] -[2023-10-17 12:41:04,285][113887] RunningMeanStd input shape: (4, 84, 84) -[2023-10-17 12:41:04,286][113887] RunningMeanStd input shape: (1,) -[2023-10-17 12:41:04,297][113887] ConvEncoder: input_channels=4 -[2023-10-17 12:41:04,401][113887] Conv encoder output size: 512 -[2023-10-17 12:41:04,969][114609] Worker 15 uses CPU cores [30, 31] -[2023-10-17 12:41:04,979][112888] Inference worker 1-0 is ready! -[2023-10-17 12:41:04,980][114575] Worker 14 uses CPU cores [28, 29] -[2023-10-17 12:41:04,980][112888] Inference worker 0-0 is ready! -[2023-10-17 12:41:04,981][112888] All inference workers are ready! Signal rollout workers to start! -[2023-10-17 12:41:04,982][113924] EnvRunner 3-0 uses policy 1 -[2023-10-17 12:41:04,982][113930] EnvRunner 7-0 uses policy 1 -[2023-10-17 12:41:04,982][113928] EnvRunner 9-0 uses policy 1 -[2023-10-17 12:41:04,982][113923] EnvRunner 1-0 uses policy 1 -[2023-10-17 12:41:04,982][113931] EnvRunner 11-0 uses policy 1 -[2023-10-17 12:41:04,982][113922] EnvRunner 2-0 uses policy 0 -[2023-10-17 12:41:04,982][113920] EnvRunner 0-0 uses policy 0 -[2023-10-17 12:41:04,982][113933] EnvRunner 13-0 uses policy 1 -[2023-10-17 12:41:04,982][113932] EnvRunner 10-0 uses policy 0 -[2023-10-17 12:41:04,982][113927] EnvRunner 8-0 uses policy 0 -[2023-10-17 12:41:04,982][113934] EnvRunner 12-0 uses policy 0 -[2023-10-17 12:41:04,983][113926] EnvRunner 6-0 uses policy 0 -[2023-10-17 12:41:04,982][112888] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan, 1: nan. Samples: 0. 
Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-10-17 12:41:04,983][113925] EnvRunner 5-0 uses policy 1 -[2023-10-17 12:41:04,983][113929] EnvRunner 4-0 uses policy 0 -[2023-10-17 12:41:05,071][114609] EnvRunner 15-0 uses policy 1 -[2023-10-17 12:41:05,131][114575] EnvRunner 14-0 uses policy 0 -[2023-10-17 12:41:06,626][113924] EnvRunner 3-1 uses policy 1 -[2023-10-17 12:41:06,629][113928] EnvRunner 9-1 uses policy 1 -[2023-10-17 12:41:06,643][113923] EnvRunner 1-1 uses policy 1 -[2023-10-17 12:41:06,665][113931] EnvRunner 11-1 uses policy 1 -[2023-10-17 12:41:06,683][113926] EnvRunner 6-1 uses policy 0 -[2023-10-17 12:41:06,714][113920] EnvRunner 0-1 uses policy 0 -[2023-10-17 12:41:06,715][113927] EnvRunner 8-1 uses policy 0 -[2023-10-17 12:41:06,788][114575] EnvRunner 14-1 uses policy 0 -[2023-10-17 12:41:07,342][112888] Heartbeat connected on Batcher_0 -[2023-10-17 12:41:07,345][112888] Heartbeat connected on LearnerWorker_p0 -[2023-10-17 12:41:07,348][112888] Heartbeat connected on Batcher_1 -[2023-10-17 12:41:07,351][112888] Heartbeat connected on LearnerWorker_p1 -[2023-10-17 12:41:07,385][112888] Heartbeat connected on InferenceWorker_p0-w0 -[2023-10-17 12:41:07,406][112888] Heartbeat connected on InferenceWorker_p1-w0 -[2023-10-17 12:41:07,857][112888] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0, 1: 0.0. Samples: 0. 
Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-10-17 12:41:07,968][113930] EnvRunner 7-1 uses policy 1 -[2023-10-17 12:41:07,999][113934] EnvRunner 12-1 uses policy 0 -[2023-10-17 12:41:08,000][113925] EnvRunner 5-1 uses policy 1 -[2023-10-17 12:41:08,000][113933] EnvRunner 13-1 uses policy 1 -[2023-10-17 12:41:08,004][113929] EnvRunner 4-1 uses policy 0 -[2023-10-17 12:41:08,005][113932] EnvRunner 10-1 uses policy 0 -[2023-10-17 12:41:08,025][113922] EnvRunner 2-1 uses policy 0 -[2023-10-17 12:41:08,097][114609] EnvRunner 15-1 uses policy 1 -[2023-10-17 12:41:08,212][112888] Heartbeat connected on RolloutWorker_w9 -[2023-10-17 12:41:08,212][112888] Heartbeat connected on RolloutWorker_w3 -[2023-10-17 12:41:08,236][112888] Heartbeat connected on RolloutWorker_w1 -[2023-10-17 12:41:08,263][112888] Heartbeat connected on RolloutWorker_w11 -[2023-10-17 12:41:08,298][112888] Heartbeat connected on RolloutWorker_w8 -[2023-10-17 12:41:08,308][112888] Heartbeat connected on RolloutWorker_w0 -[2023-10-17 12:41:08,337][112888] Heartbeat connected on RolloutWorker_w6 -[2023-10-17 12:41:08,379][112888] Heartbeat connected on RolloutWorker_w14 -[2023-10-17 12:41:10,894][112888] Heartbeat connected on RolloutWorker_w7 -[2023-10-17 12:41:10,912][112888] Heartbeat connected on RolloutWorker_w5 -[2023-10-17 12:41:10,912][112888] Heartbeat connected on RolloutWorker_w4 -[2023-10-17 12:41:10,918][112888] Heartbeat connected on RolloutWorker_w13 -[2023-10-17 12:41:10,930][112888] Heartbeat connected on RolloutWorker_w12 -[2023-10-17 12:41:10,943][112888] Heartbeat connected on RolloutWorker_w10 -[2023-10-17 12:41:10,951][112888] Heartbeat connected on RolloutWorker_w2 -[2023-10-17 12:41:11,035][112888] Heartbeat connected on RolloutWorker_w15 -[2023-10-17 12:41:12,857][112888] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 436.3, 1: 315.4. Samples: 5920. 
Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-10-17 12:41:12,858][112888] Avg episode reward: [(0, '2.176'), (1, '2.667')] -[2023-10-17 12:41:15,996][113701] Signal inference workers to stop experience collection... -[2023-10-17 12:41:16,000][113888] InferenceWorker_p1-w0: stopping experience collection -[2023-10-17 12:41:16,017][113887] InferenceWorker_p0-w0: stopping experience collection -[2023-10-17 12:41:17,511][113701] Signal inference workers to resume experience collection... -[2023-10-17 12:41:17,512][113888] InferenceWorker_p1-w0: resuming experience collection -[2023-10-17 12:41:17,512][113887] InferenceWorker_p0-w0: resuming experience collection -[2023-10-17 12:41:17,857][112888] Fps is (10 sec: 819.2, 60 sec: 636.3, 300 sec: 636.3). Total num frames: 8192. Throughput: 0: 1520.2, 1: 1453.7. Samples: 38288. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-10-17 12:41:17,858][112888] Avg episode reward: [(0, '2.550'), (1, '2.942')] -[2023-10-17 12:41:17,967][113887] Updated weights for policy 0, policy_version 20 (0.0010) -[2023-10-17 12:41:18,345][113622] Signal inference workers to stop experience collection... -[2023-10-17 12:41:18,468][113622] Signal inference workers to resume experience collection... 
-[2023-10-17 12:41:18,769][113888] Updated weights for policy 1, policy_version 40 (0.0366) -[2023-10-17 12:41:19,149][113888] Updated weights for policy 1, policy_version 50 (0.0008) -[2023-10-17 12:41:19,521][113888] Updated weights for policy 1, policy_version 60 (0.0008) -[2023-10-17 12:41:19,746][113887] Updated weights for policy 0, policy_version 33 (0.0378) -[2023-10-17 12:41:20,127][113887] Updated weights for policy 0, policy_version 43 (0.0012) -[2023-10-17 12:41:20,504][113887] Updated weights for policy 0, policy_version 53 (0.0008) -[2023-10-17 12:41:20,884][113887] Updated weights for policy 0, policy_version 63 (0.0010) -[2023-10-17 12:41:21,667][113888] Updated weights for policy 1, policy_version 70 (0.0010) -[2023-10-17 12:41:22,047][113888] Updated weights for policy 1, policy_version 80 (0.0010) -[2023-10-17 12:41:22,393][113887] Updated weights for policy 0, policy_version 76 (0.0008) -[2023-10-17 12:41:22,422][113888] Updated weights for policy 1, policy_version 90 (0.0009) -[2023-10-17 12:41:22,785][113887] Updated weights for policy 0, policy_version 86 (0.0010) -[2023-10-17 12:41:22,857][112888] Fps is (10 sec: 4095.9, 60 sec: 2291.5, 300 sec: 2291.5). Total num frames: 40960. Throughput: 0: 1807.0, 1: 1688.2. Samples: 62476. 
Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) -[2023-10-17 12:41:22,858][112888] Avg episode reward: [(0, '3.860'), (1, '3.620')] -[2023-10-17 12:41:23,168][113887] Updated weights for policy 0, policy_version 96 (0.0011) -[2023-10-17 12:41:24,366][113888] Updated weights for policy 1, policy_version 100 (0.0010) -[2023-10-17 12:41:24,743][113888] Updated weights for policy 1, policy_version 110 (0.0007) -[2023-10-17 12:41:24,868][113887] Updated weights for policy 0, policy_version 106 (0.0011) -[2023-10-17 12:41:25,126][113888] Updated weights for policy 1, policy_version 120 (0.0007) -[2023-10-17 12:41:25,255][113887] Updated weights for policy 0, policy_version 116 (0.0007) -[2023-10-17 12:41:25,633][113887] Updated weights for policy 0, policy_version 126 (0.0007) -[2023-10-17 12:41:26,860][113888] Updated weights for policy 1, policy_version 130 (0.0009) -[2023-10-17 12:41:27,230][113888] Updated weights for policy 1, policy_version 140 (0.0012) -[2023-10-17 12:41:27,232][113887] Updated weights for policy 0, policy_version 136 (0.0007) -[2023-10-17 12:41:27,618][113887] Updated weights for policy 0, policy_version 146 (0.0009) -[2023-10-17 12:41:27,701][113888] Updated weights for policy 1, policy_version 152 (0.0012) -[2023-10-17 12:41:27,857][112888] Fps is (10 sec: 5734.4, 60 sec: 2865.0, 300 sec: 2865.0). Total num frames: 65536. Throughput: 0: 1799.7, 1: 1684.7. Samples: 79704. 
Policy #0 lag: (min: 63.0, avg: 82.5, max: 95.0) -[2023-10-17 12:41:27,858][112888] Avg episode reward: [(0, '4.020'), (1, '3.780')] -[2023-10-17 12:41:27,993][113887] Updated weights for policy 0, policy_version 156 (0.0009) -[2023-10-17 12:41:29,445][113887] Updated weights for policy 0, policy_version 166 (0.0009) -[2023-10-17 12:41:29,738][113888] Updated weights for policy 1, policy_version 162 (0.0010) -[2023-10-17 12:41:29,817][113887] Updated weights for policy 0, policy_version 176 (0.0012) -[2023-10-17 12:41:30,122][113888] Updated weights for policy 1, policy_version 172 (0.0007) -[2023-10-17 12:41:30,196][113887] Updated weights for policy 0, policy_version 186 (0.0009) -[2023-10-17 12:41:30,496][113888] Updated weights for policy 1, policy_version 182 (0.0010) -[2023-10-17 12:41:30,866][113888] Updated weights for policy 1, policy_version 192 (0.0012) -[2023-10-17 12:41:32,132][113887] Updated weights for policy 0, policy_version 196 (0.0007) -[2023-10-17 12:41:32,455][113888] Updated weights for policy 1, policy_version 202 (0.0011) -[2023-10-17 12:41:32,503][113887] Updated weights for policy 0, policy_version 206 (0.0007) -[2023-10-17 12:41:32,839][113888] Updated weights for policy 1, policy_version 212 (0.0009) -[2023-10-17 12:41:32,857][112888] Fps is (10 sec: 5734.5, 60 sec: 3526.6, 300 sec: 3526.6). Total num frames: 98304. Throughput: 0: 2129.8, 1: 1981.7. Samples: 114608. 
Policy #0 lag: (min: 31.0, avg: 52.3, max: 91.0) -[2023-10-17 12:41:32,858][112888] Avg episode reward: [(0, '4.060'), (1, '4.100')] -[2023-10-17 12:41:32,889][113887] Updated weights for policy 0, policy_version 216 (0.0010) -[2023-10-17 12:41:33,211][113888] Updated weights for policy 1, policy_version 222 (0.0008) -[2023-10-17 12:41:34,492][113887] Updated weights for policy 0, policy_version 226 (0.0009) -[2023-10-17 12:41:34,871][113887] Updated weights for policy 0, policy_version 236 (0.0007) -[2023-10-17 12:41:35,258][113887] Updated weights for policy 0, policy_version 246 (0.0007) -[2023-10-17 12:41:35,377][113888] Updated weights for policy 1, policy_version 232 (0.0009) -[2023-10-17 12:41:35,640][113887] Updated weights for policy 0, policy_version 256 (0.0011) -[2023-10-17 12:41:35,746][113888] Updated weights for policy 1, policy_version 242 (0.0009) -[2023-10-17 12:41:36,118][113888] Updated weights for policy 1, policy_version 252 (0.0009) -[2023-10-17 12:41:37,805][113887] Updated weights for policy 0, policy_version 266 (0.0012) -[2023-10-17 12:41:37,857][112888] Fps is (10 sec: 6553.4, 60 sec: 3987.0, 300 sec: 3987.0). Total num frames: 131072. Throughput: 0: 2342.6, 1: 2244.1. Samples: 150788. 
Policy #0 lag: (min: 31.0, avg: 52.2, max: 77.0) -[2023-10-17 12:41:37,859][112888] Avg episode reward: [(0, '3.630'), (1, '3.770')] -[2023-10-17 12:41:38,163][113888] Updated weights for policy 1, policy_version 262 (0.0009) -[2023-10-17 12:41:38,181][113887] Updated weights for policy 0, policy_version 276 (0.0011) -[2023-10-17 12:41:38,553][113887] Updated weights for policy 0, policy_version 286 (0.0010) -[2023-10-17 12:41:38,617][113888] Updated weights for policy 1, policy_version 274 (0.0007) -[2023-10-17 12:41:38,998][113888] Updated weights for policy 1, policy_version 284 (0.0009) -[2023-10-17 12:41:40,553][113888] Updated weights for policy 1, policy_version 294 (0.0010) -[2023-10-17 12:41:40,597][113887] Updated weights for policy 0, policy_version 296 (0.0012) -[2023-10-17 12:41:40,938][113888] Updated weights for policy 1, policy_version 304 (0.0010) -[2023-10-17 12:41:40,973][113887] Updated weights for policy 0, policy_version 306 (0.0012) -[2023-10-17 12:41:41,308][113888] Updated weights for policy 1, policy_version 314 (0.0008) -[2023-10-17 12:41:41,350][113887] Updated weights for policy 0, policy_version 316 (0.0010) -[2023-10-17 12:41:42,857][112888] Fps is (10 sec: 6553.4, 60 sec: 4325.8, 300 sec: 4325.8). Total num frames: 163840. Throughput: 0: 2251.2, 1: 2216.2. Samples: 169204. 
Policy #0 lag: (min: 31.0, avg: 45.4, max: 64.0) -[2023-10-17 12:41:42,859][112888] Avg episode reward: [(0, '3.820'), (1, '3.820')] -[2023-10-17 12:41:43,283][113888] Updated weights for policy 1, policy_version 324 (0.0009) -[2023-10-17 12:41:43,627][113887] Updated weights for policy 0, policy_version 326 (0.0009) -[2023-10-17 12:41:43,649][113888] Updated weights for policy 1, policy_version 334 (0.0011) -[2023-10-17 12:41:44,008][113887] Updated weights for policy 0, policy_version 336 (0.0011) -[2023-10-17 12:41:44,026][113888] Updated weights for policy 1, policy_version 344 (0.0011) -[2023-10-17 12:41:44,384][113887] Updated weights for policy 0, policy_version 346 (0.0009) -[2023-10-17 12:41:45,779][113888] Updated weights for policy 1, policy_version 354 (0.0011) -[2023-10-17 12:41:46,133][113887] Updated weights for policy 0, policy_version 356 (0.0009) -[2023-10-17 12:41:46,146][113888] Updated weights for policy 1, policy_version 364 (0.0011) -[2023-10-17 12:41:46,509][113887] Updated weights for policy 0, policy_version 366 (0.0011) -[2023-10-17 12:41:46,526][113888] Updated weights for policy 1, policy_version 374 (0.0011) -[2023-10-17 12:41:46,898][113887] Updated weights for policy 0, policy_version 376 (0.0011) -[2023-10-17 12:41:46,899][113888] Updated weights for policy 1, policy_version 384 (0.0012) -[2023-10-17 12:41:47,857][112888] Fps is (10 sec: 6553.8, 60 sec: 4585.6, 300 sec: 4585.6). Total num frames: 196608. Throughput: 0: 2398.1, 1: 2393.3. Samples: 205428. 
Policy #0 lag: (min: 26.0, avg: 43.6, max: 58.0) -[2023-10-17 12:41:47,858][112888] Avg episode reward: [(0, '3.570'), (1, '4.220')] -[2023-10-17 12:41:48,630][113887] Updated weights for policy 0, policy_version 386 (0.0009) -[2023-10-17 12:41:48,872][113888] Updated weights for policy 1, policy_version 394 (0.0010) -[2023-10-17 12:41:49,016][113887] Updated weights for policy 0, policy_version 396 (0.0010) -[2023-10-17 12:41:49,239][113888] Updated weights for policy 1, policy_version 404 (0.0010) -[2023-10-17 12:41:49,398][113887] Updated weights for policy 0, policy_version 406 (0.0012) -[2023-10-17 12:41:49,614][113888] Updated weights for policy 1, policy_version 414 (0.0007) -[2023-10-17 12:41:49,769][113887] Updated weights for policy 0, policy_version 416 (0.0011) -[2023-10-17 12:41:51,477][113888] Updated weights for policy 1, policy_version 424 (0.0010) -[2023-10-17 12:41:51,858][113888] Updated weights for policy 1, policy_version 434 (0.0010) -[2023-10-17 12:41:51,872][113887] Updated weights for policy 0, policy_version 426 (0.0007) -[2023-10-17 12:41:52,232][113888] Updated weights for policy 1, policy_version 444 (0.0009) -[2023-10-17 12:41:52,258][113887] Updated weights for policy 0, policy_version 436 (0.0010) -[2023-10-17 12:41:52,639][113887] Updated weights for policy 0, policy_version 446 (0.0012) -[2023-10-17 12:41:52,857][112888] Fps is (10 sec: 6553.8, 60 sec: 4791.2, 300 sec: 4791.2). Total num frames: 229376. Throughput: 0: 2692.4, 1: 2704.6. Samples: 242868. Policy #0 lag: (min: 22.0, avg: 34.6, max: 54.0) -[2023-10-17 12:41:52,858][112888] Avg episode reward: [(0, '4.060'), (1, '4.720')] -[2023-10-17 12:41:52,867][113622] Saving new best policy, reward=4.060! -[2023-10-17 12:41:52,868][113701] Saving new best policy, reward=4.720! -[2023-10-17 12:41:53,504][112888] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 112888], exiting... 
-[2023-10-17 12:41:53,505][113930] Stopping RolloutWorker_w7... -[2023-10-17 12:41:53,505][113925] Stopping RolloutWorker_w5... -[2023-10-17 12:41:53,506][113930] Loop rollout_proc7_evt_loop terminating... -[2023-10-17 12:41:53,506][113925] Loop rollout_proc5_evt_loop terminating... -[2023-10-17 12:41:53,506][114609] Stopping RolloutWorker_w15... -[2023-10-17 12:41:53,505][112888] Runner profile tree view: -main_loop: 56.1012 -[2023-10-17 12:41:53,506][114609] Loop rollout_proc15_evt_loop terminating... -[2023-10-17 12:41:53,506][112888] Collected {0: 114688, 1: 114688}, FPS: 4088.6 -[2023-10-17 12:41:53,506][113622] Stopping Batcher_0... -[2023-10-17 12:41:53,507][113931] Stopping RolloutWorker_w11... -[2023-10-17 12:41:53,507][113622] Loop batcher_evt_loop terminating... -[2023-10-17 12:41:53,507][113931] Loop rollout_proc11_evt_loop terminating... -[2023-10-17 12:41:53,508][113923] Stopping RolloutWorker_w1... -[2023-10-17 12:41:53,508][113622] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000000448_114688.pth... -[2023-10-17 12:41:53,508][113923] Loop rollout_proc1_evt_loop terminating... -[2023-10-17 12:41:53,510][113934] Stopping RolloutWorker_w12... -[2023-10-17 12:41:53,510][113934] Loop rollout_proc12_evt_loop terminating... -[2023-10-17 12:41:53,511][113929] Stopping RolloutWorker_w4... -[2023-10-17 12:41:53,511][113928] Stopping RolloutWorker_w9... -[2023-10-17 12:41:53,511][113933] Stopping RolloutWorker_w13... -[2023-10-17 12:41:53,511][113929] Loop rollout_proc4_evt_loop terminating... -[2023-10-17 12:41:53,511][113928] Loop rollout_proc9_evt_loop terminating... -[2023-10-17 12:41:53,511][113933] Loop rollout_proc13_evt_loop terminating... -[2023-10-17 12:41:53,513][113932] Stopping RolloutWorker_w10... -[2023-10-17 12:41:53,513][114575] Stopping RolloutWorker_w14... -[2023-10-17 12:41:53,513][113932] Loop rollout_proc10_evt_loop terminating... -[2023-10-17 12:41:53,514][114575] Loop rollout_proc14_evt_loop terminating... 
-[2023-10-17 12:41:53,514][113924] Stopping RolloutWorker_w3... -[2023-10-17 12:41:53,515][113924] Loop rollout_proc3_evt_loop terminating... -[2023-10-17 12:41:53,515][113927] Stopping RolloutWorker_w8... -[2023-10-17 12:41:53,516][113927] Loop rollout_proc8_evt_loop terminating... -[2023-10-17 12:41:53,519][113922] Stopping RolloutWorker_w2... -[2023-10-17 12:41:53,519][113926] Stopping RolloutWorker_w6... -[2023-10-17 12:41:53,519][113922] Loop rollout_proc2_evt_loop terminating... -[2023-10-17 12:41:53,519][113926] Loop rollout_proc6_evt_loop terminating... -[2023-10-17 12:41:53,526][113920] Stopping RolloutWorker_w0... -[2023-10-17 12:41:53,527][113920] Loop rollout_proc0_evt_loop terminating... -[2023-10-17 12:41:53,531][113887] Weights refcount: 2 0 -[2023-10-17 12:41:53,533][113887] Stopping InferenceWorker_p0-w0... -[2023-10-17 12:41:53,533][113887] Loop inference_proc0-0_evt_loop terminating... -[2023-10-17 12:41:53,544][113888] Weights refcount: 2 0 -[2023-10-17 12:41:53,546][113888] Stopping InferenceWorker_p1-w0... -[2023-10-17 12:41:53,546][113888] Loop inference_proc1-0_evt_loop terminating... -[2023-10-17 12:41:53,555][113622] Stopping LearnerWorker_p0... -[2023-10-17 12:41:53,555][113622] Loop learner_proc0_evt_loop terminating... -[2023-10-17 12:41:53,570][113701] Stopping Batcher_1... -[2023-10-17 12:41:53,570][113701] Loop batcher_evt_loop terminating... -[2023-10-17 12:41:54,659][113701] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000000480_122880.pth... -[2023-10-17 12:41:54,685][113701] Stopping LearnerWorker_p1... -[2023-10-17 12:41:54,685][113701] Loop learner_proc1_evt_loop terminating... -[2023-10-17 13:26:16,112][125151] Saving configuration to ./train_atari/atari_asteroid_APPO/config.json... 
-[2023-10-17 13:26:16,442][125151] Rollout worker 0 uses device cpu -[2023-10-17 13:26:16,442][125151] Rollout worker 1 uses device cpu -[2023-10-17 13:26:16,443][125151] Rollout worker 2 uses device cpu -[2023-10-17 13:26:16,443][125151] Rollout worker 3 uses device cpu -[2023-10-17 13:26:16,444][125151] Rollout worker 4 uses device cpu -[2023-10-17 13:26:16,444][125151] Rollout worker 5 uses device cpu -[2023-10-17 13:26:16,444][125151] Rollout worker 6 uses device cpu -[2023-10-17 13:26:16,445][125151] Rollout worker 7 uses device cpu -[2023-10-17 13:26:16,445][125151] Rollout worker 8 uses device cpu -[2023-10-17 13:26:16,446][125151] Rollout worker 9 uses device cpu -[2023-10-17 13:26:16,446][125151] Rollout worker 10 uses device cpu -[2023-10-17 13:26:16,446][125151] Rollout worker 11 uses device cpu -[2023-10-17 13:26:16,447][125151] Rollout worker 12 uses device cpu -[2023-10-17 13:26:16,447][125151] Rollout worker 13 uses device cpu -[2023-10-17 13:26:16,447][125151] Rollout worker 14 uses device cpu -[2023-10-17 13:26:16,448][125151] Rollout worker 15 uses device cpu -[2023-10-17 13:26:16,739][125151] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-10-17 13:26:16,739][125151] InferenceWorker_p0-w0: min num requests: 2 -[2023-10-17 13:26:16,743][125151] Using GPUs [1] for process 1 (actually maps to GPUs [1]) -[2023-10-17 13:26:16,743][125151] InferenceWorker_p1-w0: min num requests: 2 -[2023-10-17 13:26:16,798][125151] Starting all processes... 
-[2023-10-17 13:26:16,798][125151] Starting process learner_proc0 -[2023-10-17 13:26:18,461][125151] Starting process learner_proc1 -[2023-10-17 13:26:18,464][125686] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-10-17 13:26:18,464][125686] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 -[2023-10-17 13:26:18,483][125686] Num visible devices: 1 -[2023-10-17 13:26:18,501][125686] Setting fixed seed 1234 -[2023-10-17 13:26:18,502][125686] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-10-17 13:26:18,502][125686] Initializing actor-critic model on device cuda:0 -[2023-10-17 13:26:18,502][125686] RunningMeanStd input shape: (4, 84, 84) -[2023-10-17 13:26:18,503][125686] RunningMeanStd input shape: (1,) -[2023-10-17 13:26:18,514][125686] ConvEncoder: input_channels=4 -[2023-10-17 13:26:18,683][125686] Conv encoder output size: 512 -[2023-10-17 13:26:18,685][125686] Created Actor Critic model with architecture: -[2023-10-17 13:26:18,685][125686] ActorCriticSharedWeights( - (obs_normalizer): ObservationNormalizer( - (running_mean_std): RunningMeanStdDictInPlace( - (running_mean_std): ModuleDict( - (obs): RunningMeanStdInPlace() - ) - ) - ) - (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) - (encoder): MultiInputEncoder( - (encoders): ModuleDict( - (obs): ConvEncoder( - (enc): RecursiveScriptModule( - original_name=ConvEncoderImpl - (conv_head): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Conv2d) - (1): RecursiveScriptModule(original_name=ReLU) - (2): RecursiveScriptModule(original_name=Conv2d) - (3): RecursiveScriptModule(original_name=ReLU) - (4): RecursiveScriptModule(original_name=Conv2d) - (5): RecursiveScriptModule(original_name=ReLU) - ) - (mlp_layers): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Linear) - (1): RecursiveScriptModule(original_name=ReLU) - ) - ) - 
) - ) - ) - (core): ModelCoreIdentity() - (decoder): MlpDecoder( - (mlp): Identity() - ) - (critic_linear): Linear(in_features=512, out_features=1, bias=True) - (action_parameterization): ActionParameterizationDefault( - (distribution_linear): Linear(in_features=512, out_features=14, bias=True) - ) -) -[2023-10-17 13:26:19,281][125686] Using optimizer -[2023-10-17 13:26:19,281][125686] Loading state from checkpoint ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000000448_114688.pth... -[2023-10-17 13:26:19,302][125686] Loading model from checkpoint -[2023-10-17 13:26:19,305][125686] Loaded experiment state at self.train_step=448, self.env_steps=114688 -[2023-10-17 13:26:19,305][125686] Initialized policy 0 weights for model version 448 -[2023-10-17 13:26:19,307][125686] LearnerWorker_p0 finished initialization! -[2023-10-17 13:26:19,308][125686] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-10-17 13:26:20,194][125151] Starting all processes... -[2023-10-17 13:26:20,197][125846] Using GPUs [1] for process 1 (actually maps to GPUs [1]) -[2023-10-17 13:26:20,197][125846] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1 -[2023-10-17 13:26:20,203][125151] Starting process inference_proc0-0 -[2023-10-17 13:26:20,203][125151] Starting process inference_proc1-0 -[2023-10-17 13:26:20,215][125846] Num visible devices: 1 -[2023-10-17 13:26:20,203][125151] Starting process rollout_proc0 -[2023-10-17 13:26:20,204][125151] Starting process rollout_proc1 -[2023-10-17 13:26:20,204][125151] Starting process rollout_proc2 -[2023-10-17 13:26:20,204][125151] Starting process rollout_proc3 -[2023-10-17 13:26:20,205][125151] Starting process rollout_proc4 -[2023-10-17 13:26:20,233][125846] Setting fixed seed 1234 -[2023-10-17 13:26:20,234][125846] Using GPUs [0] for process 1 (actually maps to GPUs [1]) -[2023-10-17 13:26:20,235][125846] Initializing actor-critic model on device cuda:0 -[2023-10-17 
13:26:20,235][125846] RunningMeanStd input shape: (4, 84, 84) -[2023-10-17 13:26:20,235][125846] RunningMeanStd input shape: (1,) -[2023-10-17 13:26:20,209][125151] Starting process rollout_proc5 -[2023-10-17 13:26:20,210][125151] Starting process rollout_proc6 -[2023-10-17 13:26:20,213][125151] Starting process rollout_proc7 -[2023-10-17 13:26:20,215][125151] Starting process rollout_proc8 -[2023-10-17 13:26:20,216][125151] Starting process rollout_proc9 -[2023-10-17 13:26:20,248][125846] ConvEncoder: input_channels=4 -[2023-10-17 13:26:20,217][125151] Starting process rollout_proc10 -[2023-10-17 13:26:20,217][125151] Starting process rollout_proc11 -[2023-10-17 13:26:20,217][125151] Starting process rollout_proc12 -[2023-10-17 13:26:20,218][125151] Starting process rollout_proc13 -[2023-10-17 13:26:20,608][125846] Conv encoder output size: 512 -[2023-10-17 13:26:20,610][125846] Created Actor Critic model with architecture: -[2023-10-17 13:26:20,611][125846] ActorCriticSharedWeights( - (obs_normalizer): ObservationNormalizer( - (running_mean_std): RunningMeanStdDictInPlace( - (running_mean_std): ModuleDict( - (obs): RunningMeanStdInPlace() - ) - ) - ) - (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) - (encoder): MultiInputEncoder( - (encoders): ModuleDict( - (obs): ConvEncoder( - (enc): RecursiveScriptModule( - original_name=ConvEncoderImpl - (conv_head): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Conv2d) - (1): RecursiveScriptModule(original_name=ReLU) - (2): RecursiveScriptModule(original_name=Conv2d) - (3): RecursiveScriptModule(original_name=ReLU) - (4): RecursiveScriptModule(original_name=Conv2d) - (5): RecursiveScriptModule(original_name=ReLU) - ) - (mlp_layers): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Linear) - (1): RecursiveScriptModule(original_name=ReLU) - ) - ) - ) - ) - ) - (core): ModelCoreIdentity() - (decoder): 
MlpDecoder( - (mlp): Identity() - ) - (critic_linear): Linear(in_features=512, out_features=1, bias=True) - (action_parameterization): ActionParameterizationDefault( - (distribution_linear): Linear(in_features=512, out_features=14, bias=True) - ) -) -[2023-10-17 13:26:21,316][125846] Using optimizer -[2023-10-17 13:26:21,316][125846] Loading state from checkpoint ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000000480_122880.pth... -[2023-10-17 13:26:21,335][125846] Loading model from checkpoint -[2023-10-17 13:26:21,338][125846] Loaded experiment state at self.train_step=480, self.env_steps=122880 -[2023-10-17 13:26:21,338][125846] Initialized policy 1 weights for model version 480 -[2023-10-17 13:26:21,340][125846] LearnerWorker_p1 finished initialization! -[2023-10-17 13:26:21,340][125846] Using GPUs [0] for process 1 (actually maps to GPUs [1]) -[2023-10-17 13:26:22,459][125151] Starting process rollout_proc14 -[2023-10-17 13:26:22,466][126041] Worker 4 uses CPU cores [8, 9] -[2023-10-17 13:26:22,491][125151] Starting process rollout_proc15 -[2023-10-17 13:26:22,495][126043] Worker 2 uses CPU cores [4, 5] -[2023-10-17 13:26:22,518][126039] Worker 1 uses CPU cores [2, 3] -[2023-10-17 13:26:22,558][126051] Worker 12 uses CPU cores [24, 25] -[2023-10-17 13:26:22,790][126048] Worker 9 uses CPU cores [18, 19] -[2023-10-17 13:26:22,819][126049] Worker 11 uses CPU cores [22, 23] -[2023-10-17 13:26:22,840][126042] Worker 5 uses CPU cores [10, 11] -[2023-10-17 13:26:22,846][126050] Worker 13 uses CPU cores [26, 27] -[2023-10-17 13:26:22,881][126045] Worker 7 uses CPU cores [14, 15] -[2023-10-17 13:26:22,894][126044] Worker 6 uses CPU cores [12, 13] -[2023-10-17 13:26:22,979][126037] Worker 0 uses CPU cores [0, 1] -[2023-10-17 13:26:22,994][126047] Worker 10 uses CPU cores [20, 21] -[2023-10-17 13:26:23,034][126040] Worker 3 uses CPU cores [6, 7] -[2023-10-17 13:26:23,066][126046] Worker 8 uses CPU cores [16, 17] -[2023-10-17 13:26:23,164][126004] Using GPUs 
[0] for process 0 (actually maps to GPUs [0]) -[2023-10-17 13:26:23,164][126004] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 -[2023-10-17 13:26:23,179][126005] Using GPUs [1] for process 1 (actually maps to GPUs [1]) -[2023-10-17 13:26:23,179][126005] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1 -[2023-10-17 13:26:23,183][126004] Num visible devices: 1 -[2023-10-17 13:26:23,198][126005] Num visible devices: 1 -[2023-10-17 13:26:23,834][126004] RunningMeanStd input shape: (4, 84, 84) -[2023-10-17 13:26:23,835][126004] RunningMeanStd input shape: (1,) -[2023-10-17 13:26:23,844][126005] RunningMeanStd input shape: (4, 84, 84) -[2023-10-17 13:26:23,844][126005] RunningMeanStd input shape: (1,) -[2023-10-17 13:26:23,846][126004] ConvEncoder: input_channels=4 -[2023-10-17 13:26:23,856][126005] ConvEncoder: input_channels=4 -[2023-10-17 13:26:23,952][126004] Conv encoder output size: 512 -[2023-10-17 13:26:23,956][126005] Conv encoder output size: 512 -[2023-10-17 13:26:24,420][126637] Worker 14 uses CPU cores [28, 29] -[2023-10-17 13:26:24,475][125151] Inference worker 0-0 is ready! -[2023-10-17 13:26:24,476][126669] Worker 15 uses CPU cores [30, 31] -[2023-10-17 13:26:24,476][125151] Inference worker 1-0 is ready! -[2023-10-17 13:26:24,477][125151] All inference workers are ready! Signal rollout workers to start! 
-[2023-10-17 13:26:24,478][126044] EnvRunner 6-0 uses policy 0 -[2023-10-17 13:26:24,478][126047] EnvRunner 10-0 uses policy 0 -[2023-10-17 13:26:24,478][126043] EnvRunner 2-0 uses policy 0 -[2023-10-17 13:26:24,478][126040] EnvRunner 3-0 uses policy 1 -[2023-10-17 13:26:24,478][126048] EnvRunner 9-0 uses policy 1 -[2023-10-17 13:26:24,478][126046] EnvRunner 8-0 uses policy 0 -[2023-10-17 13:26:24,478][126039] EnvRunner 1-0 uses policy 1 -[2023-10-17 13:26:24,478][126037] EnvRunner 0-0 uses policy 0 -[2023-10-17 13:26:24,478][126049] EnvRunner 11-0 uses policy 1 -[2023-10-17 13:26:24,478][126050] EnvRunner 13-0 uses policy 1 -[2023-10-17 13:26:24,478][126045] EnvRunner 7-0 uses policy 1 -[2023-10-17 13:26:24,478][126051] EnvRunner 12-0 uses policy 0 -[2023-10-17 13:26:24,478][126042] EnvRunner 5-0 uses policy 1 -[2023-10-17 13:26:24,478][125151] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 237568. Throughput: 0: nan, 1: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-10-17 13:26:24,478][126041] EnvRunner 4-0 uses policy 0 -[2023-10-17 13:26:24,567][126669] EnvRunner 15-0 uses policy 1 -[2023-10-17 13:26:24,631][126637] EnvRunner 14-0 uses policy 0 -[2023-10-17 13:26:26,109][126047] EnvRunner 10-1 uses policy 0 -[2023-10-17 13:26:26,128][126043] EnvRunner 2-1 uses policy 0 -[2023-10-17 13:26:26,138][126045] EnvRunner 7-1 uses policy 1 -[2023-10-17 13:26:26,162][126044] EnvRunner 6-1 uses policy 0 -[2023-10-17 13:26:26,170][126051] EnvRunner 12-1 uses policy 0 -[2023-10-17 13:26:26,184][126041] EnvRunner 4-1 uses policy 0 -[2023-10-17 13:26:26,186][126037] EnvRunner 0-1 uses policy 0 -[2023-10-17 13:26:26,208][126039] EnvRunner 1-1 uses policy 1 -[2023-10-17 13:26:26,218][126669] EnvRunner 15-1 uses policy 1 -[2023-10-17 13:26:26,297][126637] EnvRunner 14-1 uses policy 0 -[2023-10-17 13:26:26,385][126048] EnvRunner 9-1 uses policy 1 -[2023-10-17 13:26:26,437][126046] EnvRunner 8-1 uses policy 0 -[2023-10-17 
13:26:26,725][125151] Heartbeat connected on Batcher_0 -[2023-10-17 13:26:26,729][125151] Heartbeat connected on LearnerWorker_p0 -[2023-10-17 13:26:26,732][125151] Heartbeat connected on Batcher_1 -[2023-10-17 13:26:26,734][125151] Heartbeat connected on LearnerWorker_p1 -[2023-10-17 13:26:26,768][125151] Heartbeat connected on InferenceWorker_p0-w0 -[2023-10-17 13:26:26,785][125151] Heartbeat connected on InferenceWorker_p1-w0 -[2023-10-17 13:26:27,238][125151] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 237568. Throughput: 0: 0.0, 1: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-10-17 13:26:27,487][126042] EnvRunner 5-1 uses policy 1 -[2023-10-17 13:26:27,493][126050] EnvRunner 13-1 uses policy 1 -[2023-10-17 13:26:27,495][126040] EnvRunner 3-1 uses policy 1 -[2023-10-17 13:26:27,521][126049] EnvRunner 11-1 uses policy 1 -[2023-10-17 13:26:27,690][125151] Heartbeat connected on RolloutWorker_w10 -[2023-10-17 13:26:27,707][125151] Heartbeat connected on RolloutWorker_w2 -[2023-10-17 13:26:27,730][125151] Heartbeat connected on RolloutWorker_w7 -[2023-10-17 13:26:27,754][125151] Heartbeat connected on RolloutWorker_w6 -[2023-10-17 13:26:27,767][125151] Heartbeat connected on RolloutWorker_w4 -[2023-10-17 13:26:27,768][125151] Heartbeat connected on RolloutWorker_w12 -[2023-10-17 13:26:27,787][125151] Heartbeat connected on RolloutWorker_w0 -[2023-10-17 13:26:27,823][125151] Heartbeat connected on RolloutWorker_w15 -[2023-10-17 13:26:27,876][125151] Heartbeat connected on RolloutWorker_w1 -[2023-10-17 13:26:27,925][125151] Heartbeat connected on RolloutWorker_w14 -[2023-10-17 13:26:28,218][125151] Heartbeat connected on RolloutWorker_w9 -[2023-10-17 13:26:28,270][125151] Heartbeat connected on RolloutWorker_w8 -[2023-10-17 13:26:29,372][125151] Heartbeat connected on RolloutWorker_w3 -[2023-10-17 13:26:29,392][125151] Heartbeat connected on RolloutWorker_w11 -[2023-10-17 13:26:30,409][125151] Heartbeat connected on 
RolloutWorker_w5 -[2023-10-17 13:26:30,423][125151] Heartbeat connected on RolloutWorker_w13 -[2023-10-17 13:26:32,238][125151] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 237568. Throughput: 0: 821.7, 1: 463.4. Samples: 9972. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-10-17 13:26:32,239][125151] Avg episode reward: [(0, '2.641'), (1, '2.763')] -[2023-10-17 13:26:34,376][125686] Signal inference workers to stop experience collection... -[2023-10-17 13:26:34,385][126004] InferenceWorker_p0-w0: stopping experience collection -[2023-10-17 13:26:34,414][126005] InferenceWorker_p1-w0: stopping experience collection -[2023-10-17 13:26:36,126][125686] Signal inference workers to resume experience collection... -[2023-10-17 13:26:36,127][126005] InferenceWorker_p1-w0: resuming experience collection -[2023-10-17 13:26:36,127][126004] InferenceWorker_p0-w0: resuming experience collection -[2023-10-17 13:26:36,901][125846] Signal inference workers to stop experience collection... -[2023-10-17 13:26:37,238][125151] Fps is (10 sec: 819.2, 60 sec: 642.0, 300 sec: 642.0). Total num frames: 245760. Throughput: 0: 1635.1, 1: 1318.2. Samples: 37684. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) -[2023-10-17 13:26:37,239][125151] Avg episode reward: [(0, '3.100'), (1, '3.390')] -[2023-10-17 13:26:37,673][125846] Signal inference workers to resume experience collection... 
-[2023-10-17 13:26:37,968][126004] Updated weights for policy 0, policy_version 500 (0.0585) -[2023-10-17 13:26:38,348][126004] Updated weights for policy 0, policy_version 510 (0.0011) -[2023-10-17 13:26:38,980][126005] Updated weights for policy 1, policy_version 514 (0.0375) -[2023-10-17 13:26:39,445][126005] Updated weights for policy 1, policy_version 526 (0.0007) -[2023-10-17 13:26:39,818][126005] Updated weights for policy 1, policy_version 536 (0.0008) -[2023-10-17 13:26:40,593][126004] Updated weights for policy 0, policy_version 520 (0.0009) -[2023-10-17 13:26:40,958][126004] Updated weights for policy 0, policy_version 530 (0.0007) -[2023-10-17 13:26:41,350][126004] Updated weights for policy 0, policy_version 540 (0.0007) -[2023-10-17 13:26:41,469][126005] Updated weights for policy 1, policy_version 546 (0.0007) -[2023-10-17 13:26:41,862][126005] Updated weights for policy 1, policy_version 556 (0.0010) -[2023-10-17 13:26:42,231][126005] Updated weights for policy 1, policy_version 566 (0.0007) -[2023-10-17 13:26:42,238][125151] Fps is (10 sec: 4096.0, 60 sec: 2306.3, 300 sec: 2306.3). Total num frames: 278528. Throughput: 0: 1910.8, 1: 1690.8. Samples: 63964. Policy #0 lag: (min: 31.0, avg: 59.1, max: 95.0) -[2023-10-17 13:26:42,239][125151] Avg episode reward: [(0, '4.280'), (1, '4.170')] -[2023-10-17 13:26:42,245][125686] Saving new best policy, reward=4.280! 
-[2023-10-17 13:26:42,625][126005] Updated weights for policy 1, policy_version 576 (0.0009) -[2023-10-17 13:26:43,184][126004] Updated weights for policy 0, policy_version 550 (0.0007) -[2023-10-17 13:26:43,556][126004] Updated weights for policy 0, policy_version 560 (0.0007) -[2023-10-17 13:26:43,935][126004] Updated weights for policy 0, policy_version 570 (0.0007) -[2023-10-17 13:26:44,403][126005] Updated weights for policy 1, policy_version 586 (0.0007) -[2023-10-17 13:26:44,783][126005] Updated weights for policy 1, policy_version 596 (0.0007) -[2023-10-17 13:26:45,173][126005] Updated weights for policy 1, policy_version 606 (0.0007) -[2023-10-17 13:26:45,792][126004] Updated weights for policy 0, policy_version 580 (0.0009) -[2023-10-17 13:26:46,171][126004] Updated weights for policy 0, policy_version 590 (0.0011) -[2023-10-17 13:26:46,548][126004] Updated weights for policy 0, policy_version 600 (0.0011) -[2023-10-17 13:26:46,836][126005] Updated weights for policy 1, policy_version 616 (0.0008) -[2023-10-17 13:26:47,208][126005] Updated weights for policy 1, policy_version 626 (0.0010) -[2023-10-17 13:26:47,238][125151] Fps is (10 sec: 6553.6, 60 sec: 3239.4, 300 sec: 3239.4). Total num frames: 311296. Throughput: 0: 1885.2, 1: 1694.6. Samples: 81476. Policy #0 lag: (min: 31.0, avg: 33.8, max: 51.0) -[2023-10-17 13:26:47,239][125151] Avg episode reward: [(0, '4.650'), (1, '4.000')] -[2023-10-17 13:26:47,241][125686] Saving new best policy, reward=4.650! 
-[2023-10-17 13:26:47,587][126005] Updated weights for policy 1, policy_version 636 (0.0007) -[2023-10-17 13:26:48,360][126004] Updated weights for policy 0, policy_version 610 (0.0010) -[2023-10-17 13:26:48,734][126004] Updated weights for policy 0, policy_version 620 (0.0007) -[2023-10-17 13:26:49,115][126004] Updated weights for policy 0, policy_version 630 (0.0010) -[2023-10-17 13:26:49,504][126004] Updated weights for policy 0, policy_version 640 (0.0007) -[2023-10-17 13:26:50,019][126005] Updated weights for policy 1, policy_version 648 (0.0007) -[2023-10-17 13:26:50,401][126005] Updated weights for policy 1, policy_version 658 (0.0012) -[2023-10-17 13:26:50,785][126005] Updated weights for policy 1, policy_version 668 (0.0011) -[2023-10-17 13:26:51,350][126004] Updated weights for policy 0, policy_version 650 (0.0010) -[2023-10-17 13:26:51,729][126004] Updated weights for policy 0, policy_version 660 (0.0012) -[2023-10-17 13:26:52,110][126004] Updated weights for policy 0, policy_version 670 (0.0012) -[2023-10-17 13:26:52,238][125151] Fps is (10 sec: 6553.6, 60 sec: 3836.3, 300 sec: 3836.3). Total num frames: 344064. Throughput: 0: 2220.9, 1: 2039.9. Samples: 118280. 
Policy #0 lag: (min: 31.0, avg: 34.4, max: 55.0) -[2023-10-17 13:26:52,239][125151] Avg episode reward: [(0, '3.930'), (1, '4.360')] -[2023-10-17 13:26:52,514][126005] Updated weights for policy 1, policy_version 678 (0.0009) -[2023-10-17 13:26:52,896][126005] Updated weights for policy 1, policy_version 688 (0.0007) -[2023-10-17 13:26:53,270][126005] Updated weights for policy 1, policy_version 698 (0.0008) -[2023-10-17 13:26:53,934][126004] Updated weights for policy 0, policy_version 680 (0.0010) -[2023-10-17 13:26:54,322][126004] Updated weights for policy 0, policy_version 690 (0.0011) -[2023-10-17 13:26:54,708][126004] Updated weights for policy 0, policy_version 700 (0.0011) -[2023-10-17 13:26:54,722][126005] Updated weights for policy 1, policy_version 708 (0.0008) -[2023-10-17 13:26:55,107][126005] Updated weights for policy 1, policy_version 718 (0.0007) -[2023-10-17 13:26:55,490][126005] Updated weights for policy 1, policy_version 728 (0.0009) -[2023-10-17 13:26:56,982][126004] Updated weights for policy 0, policy_version 710 (0.0011) -[2023-10-17 13:26:57,167][126005] Updated weights for policy 1, policy_version 738 (0.0008) -[2023-10-17 13:26:57,238][125151] Fps is (10 sec: 5734.4, 60 sec: 4001.0, 300 sec: 4001.0). Total num frames: 368640. Throughput: 0: 2409.3, 1: 2353.1. Samples: 156016. 
Policy #0 lag: (min: 31.0, avg: 34.4, max: 55.0) -[2023-10-17 13:26:57,239][125151] Avg episode reward: [(0, '3.870'), (1, '4.710')] -[2023-10-17 13:26:57,365][126004] Updated weights for policy 0, policy_version 720 (0.0007) -[2023-10-17 13:26:57,548][126005] Updated weights for policy 1, policy_version 748 (0.0007) -[2023-10-17 13:26:57,737][126004] Updated weights for policy 0, policy_version 730 (0.0008) -[2023-10-17 13:26:57,913][126005] Updated weights for policy 1, policy_version 758 (0.0010) -[2023-10-17 13:26:58,302][126005] Updated weights for policy 1, policy_version 768 (0.0007) -[2023-10-17 13:26:59,653][126004] Updated weights for policy 0, policy_version 740 (0.0009) -[2023-10-17 13:27:00,029][126004] Updated weights for policy 0, policy_version 750 (0.0011) -[2023-10-17 13:27:00,136][126005] Updated weights for policy 1, policy_version 778 (0.0008) -[2023-10-17 13:27:00,406][126004] Updated weights for policy 0, policy_version 760 (0.0011) -[2023-10-17 13:27:00,518][126005] Updated weights for policy 1, policy_version 788 (0.0007) -[2023-10-17 13:27:00,894][126005] Updated weights for policy 1, policy_version 798 (0.0010) -[2023-10-17 13:27:02,155][126004] Updated weights for policy 0, policy_version 770 (0.0010) -[2023-10-17 13:27:02,238][125151] Fps is (10 sec: 5734.4, 60 sec: 4339.0, 300 sec: 4339.0). Total num frames: 401408. Throughput: 0: 2319.4, 1: 2294.1. Samples: 174204. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) -[2023-10-17 13:27:02,239][125151] Avg episode reward: [(0, '4.830'), (1, '5.140')] -[2023-10-17 13:27:02,241][125846] Saving new best policy, reward=5.140! 
-[2023-10-17 13:27:02,532][126004] Updated weights for policy 0, policy_version 780 (0.0010) -[2023-10-17 13:27:02,702][126005] Updated weights for policy 1, policy_version 808 (0.0012) -[2023-10-17 13:27:02,909][126004] Updated weights for policy 0, policy_version 790 (0.0009) -[2023-10-17 13:27:03,080][126005] Updated weights for policy 1, policy_version 818 (0.0011) -[2023-10-17 13:27:03,287][126004] Updated weights for policy 0, policy_version 800 (0.0010) -[2023-10-17 13:27:03,288][125686] Saving new best policy, reward=4.830! -[2023-10-17 13:27:03,460][126005] Updated weights for policy 1, policy_version 828 (0.0011) -[2023-10-17 13:27:05,004][126004] Updated weights for policy 0, policy_version 810 (0.0007) -[2023-10-17 13:27:05,039][126005] Updated weights for policy 1, policy_version 838 (0.0011) -[2023-10-17 13:27:05,386][126004] Updated weights for policy 0, policy_version 820 (0.0007) -[2023-10-17 13:27:05,419][126005] Updated weights for policy 1, policy_version 848 (0.0010) -[2023-10-17 13:27:05,773][126004] Updated weights for policy 0, policy_version 830 (0.0007) -[2023-10-17 13:27:05,798][126005] Updated weights for policy 1, policy_version 858 (0.0011) -[2023-10-17 13:27:07,238][125151] Fps is (10 sec: 6553.8, 60 sec: 4598.0, 300 sec: 4598.0). Total num frames: 434176. Throughput: 0: 2490.8, 1: 2462.3. Samples: 211796. 
Policy #0 lag: (min: 26.0, avg: 53.1, max: 71.0) -[2023-10-17 13:27:07,239][125151] Avg episode reward: [(0, '4.720'), (1, '4.660')] -[2023-10-17 13:27:07,650][126004] Updated weights for policy 0, policy_version 840 (0.0007) -[2023-10-17 13:27:08,037][126004] Updated weights for policy 0, policy_version 850 (0.0008) -[2023-10-17 13:27:08,057][126005] Updated weights for policy 1, policy_version 868 (0.0011) -[2023-10-17 13:27:08,422][126004] Updated weights for policy 0, policy_version 860 (0.0011) -[2023-10-17 13:27:08,429][126005] Updated weights for policy 1, policy_version 878 (0.0011) -[2023-10-17 13:27:08,800][126005] Updated weights for policy 1, policy_version 888 (0.0011) -[2023-10-17 13:27:10,364][126004] Updated weights for policy 0, policy_version 870 (0.0011) -[2023-10-17 13:27:10,735][126004] Updated weights for policy 0, policy_version 880 (0.0008) -[2023-10-17 13:27:10,811][126005] Updated weights for policy 1, policy_version 900 (0.0026) -[2023-10-17 13:27:11,128][126004] Updated weights for policy 0, policy_version 890 (0.0008) -[2023-10-17 13:27:11,188][126005] Updated weights for policy 1, policy_version 910 (0.0012) -[2023-10-17 13:27:11,565][126005] Updated weights for policy 1, policy_version 920 (0.0012) -[2023-10-17 13:27:12,238][125151] Fps is (10 sec: 6553.5, 60 sec: 4802.7, 300 sec: 4802.7). Total num frames: 466944. Throughput: 0: 2787.9, 1: 2716.3. Samples: 247692. 
Policy #0 lag: (min: 22.0, avg: 30.7, max: 54.0) -[2023-10-17 13:27:12,239][125151] Avg episode reward: [(0, '4.320'), (1, '4.680')] -[2023-10-17 13:27:12,696][126004] Updated weights for policy 0, policy_version 900 (0.0009) -[2023-10-17 13:27:13,078][126004] Updated weights for policy 0, policy_version 910 (0.0011) -[2023-10-17 13:27:13,460][126004] Updated weights for policy 0, policy_version 920 (0.0011) -[2023-10-17 13:27:13,478][126005] Updated weights for policy 1, policy_version 930 (0.0012) -[2023-10-17 13:27:13,854][126005] Updated weights for policy 1, policy_version 940 (0.0012) -[2023-10-17 13:27:14,238][126005] Updated weights for policy 1, policy_version 950 (0.0011) -[2023-10-17 13:27:14,625][126005] Updated weights for policy 1, policy_version 960 (0.0007) -[2023-10-17 13:27:15,741][126004] Updated weights for policy 0, policy_version 930 (0.0012) -[2023-10-17 13:27:16,115][126004] Updated weights for policy 0, policy_version 940 (0.0012) -[2023-10-17 13:27:16,494][126004] Updated weights for policy 0, policy_version 950 (0.0011) -[2023-10-17 13:27:16,568][126005] Updated weights for policy 1, policy_version 970 (0.0008) -[2023-10-17 13:27:16,876][126004] Updated weights for policy 0, policy_version 960 (0.0010) -[2023-10-17 13:27:16,949][126005] Updated weights for policy 1, policy_version 980 (0.0007) -[2023-10-17 13:27:17,238][125151] Fps is (10 sec: 5734.4, 60 sec: 4813.4, 300 sec: 4813.4). Total num frames: 491520. Throughput: 0: 2840.4, 1: 2837.8. Samples: 265488. 
Policy #0 lag: (min: 30.0, avg: 60.3, max: 87.0) -[2023-10-17 13:27:17,239][125151] Avg episode reward: [(0, '4.310'), (1, '4.720')] -[2023-10-17 13:27:17,329][126005] Updated weights for policy 1, policy_version 990 (0.0007) -[2023-10-17 13:27:18,563][126004] Updated weights for policy 0, policy_version 970 (0.0007) -[2023-10-17 13:27:18,957][126004] Updated weights for policy 0, policy_version 980 (0.0008) -[2023-10-17 13:27:19,342][126004] Updated weights for policy 0, policy_version 990 (0.0011) -[2023-10-17 13:27:19,635][126005] Updated weights for policy 1, policy_version 1000 (0.0007) -[2023-10-17 13:27:20,015][126005] Updated weights for policy 1, policy_version 1010 (0.0007) -[2023-10-17 13:27:20,398][126005] Updated weights for policy 1, policy_version 1020 (0.0010) -[2023-10-17 13:27:20,808][126004] Updated weights for policy 0, policy_version 1002 (0.0029) -[2023-10-17 13:27:21,184][126004] Updated weights for policy 0, policy_version 1012 (0.0012) -[2023-10-17 13:27:21,564][126004] Updated weights for policy 0, policy_version 1022 (0.0012) -[2023-10-17 13:27:22,034][126005] Updated weights for policy 1, policy_version 1030 (0.0016) -[2023-10-17 13:27:22,238][125151] Fps is (10 sec: 5734.5, 60 sec: 4964.0, 300 sec: 4964.0). Total num frames: 524288. Throughput: 0: 2938.7, 1: 2922.0. Samples: 301416. 
Policy #0 lag: (min: 31.0, avg: 49.5, max: 63.0) -[2023-10-17 13:27:22,239][125151] Avg episode reward: [(0, '4.430'), (1, '4.970')] -[2023-10-17 13:27:22,409][126005] Updated weights for policy 1, policy_version 1040 (0.0012) -[2023-10-17 13:27:22,797][126005] Updated weights for policy 1, policy_version 1050 (0.0012) -[2023-10-17 13:27:23,122][126004] Updated weights for policy 0, policy_version 1032 (0.0009) -[2023-10-17 13:27:23,502][126004] Updated weights for policy 0, policy_version 1042 (0.0008) -[2023-10-17 13:27:23,897][126004] Updated weights for policy 0, policy_version 1052 (0.0007) -[2023-10-17 13:27:24,563][126005] Updated weights for policy 1, policy_version 1060 (0.0011) -[2023-10-17 13:27:24,954][126005] Updated weights for policy 1, policy_version 1070 (0.0008) -[2023-10-17 13:27:25,341][126005] Updated weights for policy 1, policy_version 1080 (0.0009) -[2023-10-17 13:27:25,985][126004] Updated weights for policy 0, policy_version 1062 (0.0007) -[2023-10-17 13:27:26,374][126004] Updated weights for policy 0, policy_version 1072 (0.0007) -[2023-10-17 13:27:26,757][126004] Updated weights for policy 0, policy_version 1082 (0.0007) -[2023-10-17 13:27:27,238][125151] Fps is (10 sec: 6553.7, 60 sec: 5324.8, 300 sec: 5090.7). Total num frames: 557056. Throughput: 0: 3022.5, 1: 3043.0. Samples: 336912. 
Policy #0 lag: (min: 28.0, avg: 47.6, max: 64.0) -[2023-10-17 13:27:27,238][125151] Avg episode reward: [(0, '4.560'), (1, '5.050')] -[2023-10-17 13:27:27,242][126005] Updated weights for policy 1, policy_version 1090 (0.0011) -[2023-10-17 13:27:27,625][126005] Updated weights for policy 1, policy_version 1100 (0.0011) -[2023-10-17 13:27:28,015][126005] Updated weights for policy 1, policy_version 1110 (0.0011) -[2023-10-17 13:27:28,398][126005] Updated weights for policy 1, policy_version 1120 (0.0011) -[2023-10-17 13:27:28,943][126004] Updated weights for policy 0, policy_version 1092 (0.0007) -[2023-10-17 13:27:29,334][126004] Updated weights for policy 0, policy_version 1102 (0.0007) -[2023-10-17 13:27:29,718][126004] Updated weights for policy 0, policy_version 1112 (0.0011) -[2023-10-17 13:27:30,506][126005] Updated weights for policy 1, policy_version 1130 (0.0010) -[2023-10-17 13:27:30,893][126005] Updated weights for policy 1, policy_version 1140 (0.0008) -[2023-10-17 13:27:31,270][126005] Updated weights for policy 1, policy_version 1150 (0.0007) -[2023-10-17 13:27:31,888][126004] Updated weights for policy 0, policy_version 1122 (0.0011) -[2023-10-17 13:27:32,238][125151] Fps is (10 sec: 5734.4, 60 sec: 5734.4, 300 sec: 5077.7). Total num frames: 581632. Throughput: 0: 2998.4, 1: 3065.1. Samples: 354332. Policy #0 lag: (min: 28.0, avg: 47.6, max: 64.0) -[2023-10-17 13:27:32,239][125151] Avg episode reward: [(0, '4.910'), (1, '5.080')] -[2023-10-17 13:27:32,273][126004] Updated weights for policy 0, policy_version 1132 (0.0011) -[2023-10-17 13:27:32,658][126004] Updated weights for policy 0, policy_version 1142 (0.0010) -[2023-10-17 13:27:33,037][126004] Updated weights for policy 0, policy_version 1152 (0.0007) -[2023-10-17 13:27:33,037][125686] Saving new best policy, reward=4.910! 
-[2023-10-17 13:27:33,247][126005] Updated weights for policy 1, policy_version 1160 (0.0008) -[2023-10-17 13:27:33,615][126005] Updated weights for policy 1, policy_version 1170 (0.0007) -[2023-10-17 13:27:33,995][126005] Updated weights for policy 1, policy_version 1180 (0.0007) -[2023-10-17 13:27:35,275][126004] Updated weights for policy 0, policy_version 1162 (0.0012) -[2023-10-17 13:27:35,665][126004] Updated weights for policy 0, policy_version 1172 (0.0012) -[2023-10-17 13:27:35,922][126005] Updated weights for policy 1, policy_version 1190 (0.0008) -[2023-10-17 13:27:36,031][126004] Updated weights for policy 0, policy_version 1182 (0.0010) -[2023-10-17 13:27:36,303][126005] Updated weights for policy 1, policy_version 1200 (0.0010) -[2023-10-17 13:27:36,685][126005] Updated weights for policy 1, policy_version 1210 (0.0011) -[2023-10-17 13:27:37,238][125151] Fps is (10 sec: 5734.4, 60 sec: 6144.0, 300 sec: 5179.1). Total num frames: 614400. Throughput: 0: 2931.6, 1: 3062.6. Samples: 388020. 
Policy #0 lag: (min: 15.0, avg: 28.1, max: 47.0) -[2023-10-17 13:27:37,239][125151] Avg episode reward: [(0, '4.810'), (1, '5.030')] -[2023-10-17 13:27:37,557][126004] Updated weights for policy 0, policy_version 1192 (0.0007) -[2023-10-17 13:27:37,942][126004] Updated weights for policy 0, policy_version 1202 (0.0007) -[2023-10-17 13:27:38,332][126004] Updated weights for policy 0, policy_version 1212 (0.0007) -[2023-10-17 13:27:38,676][126005] Updated weights for policy 1, policy_version 1220 (0.0012) -[2023-10-17 13:27:39,056][126005] Updated weights for policy 1, policy_version 1230 (0.0011) -[2023-10-17 13:27:39,429][126005] Updated weights for policy 1, policy_version 1240 (0.0012) -[2023-10-17 13:27:40,382][126004] Updated weights for policy 0, policy_version 1222 (0.0009) -[2023-10-17 13:27:40,768][126004] Updated weights for policy 0, policy_version 1232 (0.0011) -[2023-10-17 13:27:40,994][126005] Updated weights for policy 1, policy_version 1250 (0.0012) -[2023-10-17 13:27:41,155][126004] Updated weights for policy 0, policy_version 1242 (0.0011) -[2023-10-17 13:27:41,368][126005] Updated weights for policy 1, policy_version 1260 (0.0012) -[2023-10-17 13:27:41,749][126005] Updated weights for policy 1, policy_version 1270 (0.0012) -[2023-10-17 13:27:42,130][126005] Updated weights for policy 1, policy_version 1280 (0.0011) -[2023-10-17 13:27:42,238][125151] Fps is (10 sec: 6553.6, 60 sec: 6144.0, 300 sec: 5267.5). Total num frames: 647168. Throughput: 0: 2954.0, 1: 2983.6. Samples: 423204. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) -[2023-10-17 13:27:42,239][125151] Avg episode reward: [(0, '5.170'), (1, '5.420')] -[2023-10-17 13:27:42,251][125686] Saving new best policy, reward=5.170! -[2023-10-17 13:27:42,251][125846] Saving new best policy, reward=5.420! 
-[2023-10-17 13:27:43,417][126004] Updated weights for policy 0, policy_version 1252 (0.0008) -[2023-10-17 13:27:43,803][126004] Updated weights for policy 0, policy_version 1262 (0.0007) -[2023-10-17 13:27:44,184][126004] Updated weights for policy 0, policy_version 1272 (0.0007) -[2023-10-17 13:27:44,497][126005] Updated weights for policy 1, policy_version 1290 (0.0007) -[2023-10-17 13:27:44,896][126005] Updated weights for policy 1, policy_version 1300 (0.0007) -[2023-10-17 13:27:45,276][126005] Updated weights for policy 1, policy_version 1310 (0.0007) -[2023-10-17 13:27:46,392][126004] Updated weights for policy 0, policy_version 1282 (0.0008) -[2023-10-17 13:27:46,774][126004] Updated weights for policy 0, policy_version 1292 (0.0011) -[2023-10-17 13:27:47,039][126005] Updated weights for policy 1, policy_version 1320 (0.0009) -[2023-10-17 13:27:47,162][126004] Updated weights for policy 0, policy_version 1302 (0.0007) -[2023-10-17 13:27:47,238][125151] Fps is (10 sec: 4915.1, 60 sec: 5870.9, 300 sec: 5147.2). Total num frames: 663552. Throughput: 0: 2956.2, 1: 2969.3. Samples: 440852. 
Policy #0 lag: (min: 12.0, avg: 26.9, max: 44.0) -[2023-10-17 13:27:47,240][125151] Avg episode reward: [(0, '4.910'), (1, '4.650')] -[2023-10-17 13:27:47,416][126005] Updated weights for policy 1, policy_version 1330 (0.0011) -[2023-10-17 13:27:47,555][126004] Updated weights for policy 0, policy_version 1312 (0.0007) -[2023-10-17 13:27:47,795][126005] Updated weights for policy 1, policy_version 1340 (0.0012) -[2023-10-17 13:27:49,769][126004] Updated weights for policy 0, policy_version 1322 (0.0009) -[2023-10-17 13:27:49,930][126005] Updated weights for policy 1, policy_version 1350 (0.0009) -[2023-10-17 13:27:50,143][126004] Updated weights for policy 0, policy_version 1332 (0.0010) -[2023-10-17 13:27:50,317][126005] Updated weights for policy 1, policy_version 1360 (0.0008) -[2023-10-17 13:27:50,531][126004] Updated weights for policy 0, policy_version 1342 (0.0009) -[2023-10-17 13:27:50,692][126005] Updated weights for policy 1, policy_version 1370 (0.0010) -[2023-10-17 13:27:52,173][126004] Updated weights for policy 0, policy_version 1352 (0.0012) -[2023-10-17 13:27:52,238][125151] Fps is (10 sec: 4915.2, 60 sec: 5870.9, 300 sec: 5227.4). Total num frames: 696320. Throughput: 0: 2924.2, 1: 2951.1. Samples: 476184. 
Policy #0 lag: (min: 34.0, avg: 49.9, max: 72.0) -[2023-10-17 13:27:52,239][125151] Avg episode reward: [(0, '4.650'), (1, '4.630')] -[2023-10-17 13:27:52,564][126004] Updated weights for policy 0, policy_version 1362 (0.0008) -[2023-10-17 13:27:52,628][126005] Updated weights for policy 1, policy_version 1380 (0.0010) -[2023-10-17 13:27:52,946][126004] Updated weights for policy 0, policy_version 1372 (0.0007) -[2023-10-17 13:27:53,012][126005] Updated weights for policy 1, policy_version 1390 (0.0010) -[2023-10-17 13:27:53,385][126005] Updated weights for policy 1, policy_version 1400 (0.0008) -[2023-10-17 13:27:54,820][126004] Updated weights for policy 0, policy_version 1382 (0.0007) -[2023-10-17 13:27:55,214][126004] Updated weights for policy 0, policy_version 1392 (0.0007) -[2023-10-17 13:27:55,594][126004] Updated weights for policy 0, policy_version 1402 (0.0007) -[2023-10-17 13:27:55,641][126005] Updated weights for policy 1, policy_version 1410 (0.0007) -[2023-10-17 13:27:56,018][126005] Updated weights for policy 1, policy_version 1420 (0.0010) -[2023-10-17 13:27:56,395][126005] Updated weights for policy 1, policy_version 1430 (0.0011) -[2023-10-17 13:27:56,777][126005] Updated weights for policy 1, policy_version 1440 (0.0009) -[2023-10-17 13:27:57,238][125151] Fps is (10 sec: 6553.6, 60 sec: 6007.5, 300 sec: 5298.8). Total num frames: 729088. Throughput: 0: 2912.2, 1: 2944.0. Samples: 511220. 
Policy #0 lag: (min: 31.0, avg: 40.6, max: 63.0) -[2023-10-17 13:27:57,239][125151] Avg episode reward: [(0, '4.440'), (1, '5.180')] -[2023-10-17 13:27:57,652][126004] Updated weights for policy 0, policy_version 1412 (0.0009) -[2023-10-17 13:27:58,048][126004] Updated weights for policy 0, policy_version 1422 (0.0011) -[2023-10-17 13:27:58,428][126004] Updated weights for policy 0, policy_version 1432 (0.0011) -[2023-10-17 13:27:58,722][126005] Updated weights for policy 1, policy_version 1450 (0.0009) -[2023-10-17 13:27:59,104][126005] Updated weights for policy 1, policy_version 1460 (0.0007) -[2023-10-17 13:27:59,485][126005] Updated weights for policy 1, policy_version 1470 (0.0007) -[2023-10-17 13:28:00,554][126004] Updated weights for policy 0, policy_version 1442 (0.0010) -[2023-10-17 13:28:00,943][126004] Updated weights for policy 0, policy_version 1452 (0.0009) -[2023-10-17 13:28:01,108][126005] Updated weights for policy 1, policy_version 1480 (0.0008) -[2023-10-17 13:28:01,339][126004] Updated weights for policy 0, policy_version 1462 (0.0011) -[2023-10-17 13:28:01,495][126005] Updated weights for policy 1, policy_version 1490 (0.0007) -[2023-10-17 13:28:01,727][126004] Updated weights for policy 0, policy_version 1472 (0.0011) -[2023-10-17 13:28:01,875][126005] Updated weights for policy 1, policy_version 1500 (0.0007) -[2023-10-17 13:28:02,238][125151] Fps is (10 sec: 6553.6, 60 sec: 6007.5, 300 sec: 5363.0). Total num frames: 761856. Throughput: 0: 2914.6, 1: 2948.6. Samples: 529332. 
Policy #0 lag: (min: 13.0, avg: 40.4, max: 47.0) -[2023-10-17 13:28:02,239][125151] Avg episode reward: [(0, '4.300'), (1, '5.210')] -[2023-10-17 13:28:03,477][126005] Updated weights for policy 1, policy_version 1510 (0.0010) -[2023-10-17 13:28:03,518][126004] Updated weights for policy 0, policy_version 1482 (0.0011) -[2023-10-17 13:28:03,857][126005] Updated weights for policy 1, policy_version 1520 (0.0011) -[2023-10-17 13:28:03,895][126004] Updated weights for policy 0, policy_version 1492 (0.0011) -[2023-10-17 13:28:04,239][126005] Updated weights for policy 1, policy_version 1530 (0.0007) -[2023-10-17 13:28:04,283][126004] Updated weights for policy 0, policy_version 1502 (0.0008) -[2023-10-17 13:28:06,257][126005] Updated weights for policy 1, policy_version 1540 (0.0007) -[2023-10-17 13:28:06,584][126004] Updated weights for policy 0, policy_version 1512 (0.0011) -[2023-10-17 13:28:06,637][126005] Updated weights for policy 1, policy_version 1550 (0.0010) -[2023-10-17 13:28:06,968][126004] Updated weights for policy 0, policy_version 1522 (0.0011) -[2023-10-17 13:28:07,018][126005] Updated weights for policy 1, policy_version 1560 (0.0011) -[2023-10-17 13:28:07,238][125151] Fps is (10 sec: 4915.3, 60 sec: 5734.4, 300 sec: 5261.5). Total num frames: 778240. Throughput: 0: 2883.8, 1: 2994.9. Samples: 565956. 
Policy #0 lag: (min: 13.0, avg: 40.4, max: 47.0) -[2023-10-17 13:28:07,239][125151] Avg episode reward: [(0, '4.120'), (1, '5.260')] -[2023-10-17 13:28:07,364][126004] Updated weights for policy 0, policy_version 1532 (0.0011) -[2023-10-17 13:28:08,793][126005] Updated weights for policy 1, policy_version 1570 (0.0012) -[2023-10-17 13:28:08,994][126004] Updated weights for policy 0, policy_version 1542 (0.0010) -[2023-10-17 13:28:09,177][126005] Updated weights for policy 1, policy_version 1580 (0.0011) -[2023-10-17 13:28:09,375][126004] Updated weights for policy 0, policy_version 1552 (0.0010) -[2023-10-17 13:28:09,562][126005] Updated weights for policy 1, policy_version 1590 (0.0012) -[2023-10-17 13:28:09,759][126004] Updated weights for policy 0, policy_version 1562 (0.0007) -[2023-10-17 13:28:09,943][126005] Updated weights for policy 1, policy_version 1600 (0.0011) -[2023-10-17 13:28:11,812][126004] Updated weights for policy 0, policy_version 1572 (0.0009) -[2023-10-17 13:28:11,966][126005] Updated weights for policy 1, policy_version 1610 (0.0012) -[2023-10-17 13:28:12,190][126004] Updated weights for policy 0, policy_version 1582 (0.0011) -[2023-10-17 13:28:12,238][125151] Fps is (10 sec: 4915.1, 60 sec: 5734.4, 300 sec: 5321.5). Total num frames: 811008. Throughput: 0: 2888.1, 1: 2979.4. Samples: 600952. Policy #0 lag: (min: 31.0, avg: 41.4, max: 63.0) -[2023-10-17 13:28:12,239][125151] Avg episode reward: [(0, '5.240'), (1, '6.000')] -[2023-10-17 13:28:12,338][126005] Updated weights for policy 1, policy_version 1620 (0.0012) -[2023-10-17 13:28:12,570][126004] Updated weights for policy 0, policy_version 1592 (0.0011) -[2023-10-17 13:28:12,717][126005] Updated weights for policy 1, policy_version 1630 (0.0012) -[2023-10-17 13:28:12,799][125846] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000001632_417792.pth... -[2023-10-17 13:28:12,844][125846] Saving new best policy, reward=6.000! 
-[2023-10-17 13:28:12,877][125686] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000001600_409600.pth... -[2023-10-17 13:28:12,906][125686] Saving new best policy, reward=5.240! -[2023-10-17 13:28:14,468][126004] Updated weights for policy 0, policy_version 1602 (0.0011) -[2023-10-17 13:28:14,616][126005] Updated weights for policy 1, policy_version 1640 (0.0010) -[2023-10-17 13:28:14,856][126004] Updated weights for policy 0, policy_version 1612 (0.0007) -[2023-10-17 13:28:14,998][126005] Updated weights for policy 1, policy_version 1650 (0.0007) -[2023-10-17 13:28:15,244][126004] Updated weights for policy 0, policy_version 1622 (0.0009) -[2023-10-17 13:28:15,375][126005] Updated weights for policy 1, policy_version 1660 (0.0007) -[2023-10-17 13:28:15,629][126004] Updated weights for policy 0, policy_version 1632 (0.0011) -[2023-10-17 13:28:17,150][126005] Updated weights for policy 1, policy_version 1670 (0.0007) -[2023-10-17 13:28:17,238][125151] Fps is (10 sec: 6553.5, 60 sec: 5870.9, 300 sec: 5376.1). Total num frames: 843776. Throughput: 0: 2905.2, 1: 2972.1. Samples: 618808. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) -[2023-10-17 13:28:17,239][125151] Avg episode reward: [(0, '5.600'), (1, '6.290')] -[2023-10-17 13:28:17,241][125686] Saving new best policy, reward=5.600! -[2023-10-17 13:28:17,536][126005] Updated weights for policy 1, policy_version 1680 (0.0009) -[2023-10-17 13:28:17,928][126005] Updated weights for policy 1, policy_version 1690 (0.0011) -[2023-10-17 13:28:17,930][126004] Updated weights for policy 0, policy_version 1642 (0.0007) -[2023-10-17 13:28:18,152][125846] Saving new best policy, reward=6.290! 
-[2023-10-17 13:28:18,327][126004] Updated weights for policy 0, policy_version 1652 (0.0007) -[2023-10-17 13:28:18,707][126004] Updated weights for policy 0, policy_version 1662 (0.0011) -[2023-10-17 13:28:19,366][126005] Updated weights for policy 1, policy_version 1700 (0.0011) -[2023-10-17 13:28:19,747][126005] Updated weights for policy 1, policy_version 1710 (0.0012) -[2023-10-17 13:28:20,135][126005] Updated weights for policy 1, policy_version 1720 (0.0012) -[2023-10-17 13:28:20,355][126004] Updated weights for policy 0, policy_version 1672 (0.0008) -[2023-10-17 13:28:20,736][126004] Updated weights for policy 0, policy_version 1682 (0.0009) -[2023-10-17 13:28:21,132][126004] Updated weights for policy 0, policy_version 1692 (0.0007) -[2023-10-17 13:28:22,238][125151] Fps is (10 sec: 6553.7, 60 sec: 5870.9, 300 sec: 5426.1). Total num frames: 876544. Throughput: 0: 2942.5, 1: 2984.8. Samples: 654748. Policy #0 lag: (min: 31.0, avg: 54.9, max: 95.0) -[2023-10-17 13:28:22,239][125151] Avg episode reward: [(0, '5.620'), (1, '5.800')] -[2023-10-17 13:28:22,241][125686] Saving new best policy, reward=5.620! 
-[2023-10-17 13:28:22,290][126005] Updated weights for policy 1, policy_version 1730 (0.0012) -[2023-10-17 13:28:22,683][126005] Updated weights for policy 1, policy_version 1740 (0.0007) -[2023-10-17 13:28:23,064][126005] Updated weights for policy 1, policy_version 1750 (0.0011) -[2023-10-17 13:28:23,076][126004] Updated weights for policy 0, policy_version 1702 (0.0010) -[2023-10-17 13:28:23,453][126005] Updated weights for policy 1, policy_version 1760 (0.0009) -[2023-10-17 13:28:23,456][126004] Updated weights for policy 0, policy_version 1712 (0.0009) -[2023-10-17 13:28:23,836][126004] Updated weights for policy 0, policy_version 1722 (0.0007) -[2023-10-17 13:28:25,304][126005] Updated weights for policy 1, policy_version 1770 (0.0011) -[2023-10-17 13:28:25,687][126005] Updated weights for policy 1, policy_version 1780 (0.0008) -[2023-10-17 13:28:25,865][126004] Updated weights for policy 0, policy_version 1732 (0.0008) -[2023-10-17 13:28:26,072][126005] Updated weights for policy 1, policy_version 1790 (0.0007) -[2023-10-17 13:28:26,245][126004] Updated weights for policy 0, policy_version 1742 (0.0011) -[2023-10-17 13:28:26,628][126004] Updated weights for policy 0, policy_version 1752 (0.0012) -[2023-10-17 13:28:27,238][125151] Fps is (10 sec: 6553.6, 60 sec: 5870.9, 300 sec: 5472.0). Total num frames: 909312. Throughput: 0: 2931.9, 1: 3033.2. Samples: 691636. Policy #0 lag: (min: 31.0, avg: 33.6, max: 50.0) -[2023-10-17 13:28:27,239][125151] Avg episode reward: [(0, '5.760'), (1, '5.510')] -[2023-10-17 13:28:27,251][125686] Saving new best policy, reward=5.760! 
-[2023-10-17 13:28:27,681][126005] Updated weights for policy 1, policy_version 1800 (0.0011) -[2023-10-17 13:28:28,073][126005] Updated weights for policy 1, policy_version 1810 (0.0010) -[2023-10-17 13:28:28,425][126004] Updated weights for policy 0, policy_version 1762 (0.0011) -[2023-10-17 13:28:28,444][126005] Updated weights for policy 1, policy_version 1820 (0.0007) -[2023-10-17 13:28:28,808][126004] Updated weights for policy 0, policy_version 1772 (0.0010) -[2023-10-17 13:28:29,191][126004] Updated weights for policy 0, policy_version 1782 (0.0011) -[2023-10-17 13:28:29,568][126004] Updated weights for policy 0, policy_version 1792 (0.0011) -[2023-10-17 13:28:30,277][126005] Updated weights for policy 1, policy_version 1830 (0.0008) -[2023-10-17 13:28:30,670][126005] Updated weights for policy 1, policy_version 1840 (0.0007) -[2023-10-17 13:28:31,054][126005] Updated weights for policy 1, policy_version 1850 (0.0007) -[2023-10-17 13:28:31,329][126004] Updated weights for policy 0, policy_version 1802 (0.0011) -[2023-10-17 13:28:31,723][126004] Updated weights for policy 0, policy_version 1812 (0.0011) -[2023-10-17 13:28:32,105][126004] Updated weights for policy 0, policy_version 1822 (0.0011) -[2023-10-17 13:28:32,238][125151] Fps is (10 sec: 6553.7, 60 sec: 6007.5, 300 sec: 5514.3). Total num frames: 942080. Throughput: 0: 2948.3, 1: 3036.8. Samples: 710180. Policy #0 lag: (min: 28.0, avg: 56.9, max: 92.0) -[2023-10-17 13:28:32,239][125151] Avg episode reward: [(0, '6.060'), (1, '5.090')] -[2023-10-17 13:28:32,240][125686] Saving new best policy, reward=6.060! 
-[2023-10-17 13:28:33,097][126005] Updated weights for policy 1, policy_version 1860 (0.0009) -[2023-10-17 13:28:33,467][126005] Updated weights for policy 1, policy_version 1870 (0.0011) -[2023-10-17 13:28:33,521][126004] Updated weights for policy 0, policy_version 1832 (0.0011) -[2023-10-17 13:28:33,852][126005] Updated weights for policy 1, policy_version 1880 (0.0011) -[2023-10-17 13:28:33,913][126004] Updated weights for policy 0, policy_version 1842 (0.0011) -[2023-10-17 13:28:34,292][126004] Updated weights for policy 0, policy_version 1852 (0.0012) -[2023-10-17 13:28:35,411][126005] Updated weights for policy 1, policy_version 1890 (0.0011) -[2023-10-17 13:28:35,806][126005] Updated weights for policy 1, policy_version 1900 (0.0012) -[2023-10-17 13:28:36,187][126005] Updated weights for policy 1, policy_version 1910 (0.0007) -[2023-10-17 13:28:36,488][126004] Updated weights for policy 0, policy_version 1862 (0.0011) -[2023-10-17 13:28:36,572][126005] Updated weights for policy 1, policy_version 1920 (0.0007) -[2023-10-17 13:28:36,877][126004] Updated weights for policy 0, policy_version 1872 (0.0012) -[2023-10-17 13:28:37,238][125151] Fps is (10 sec: 5734.6, 60 sec: 5870.9, 300 sec: 5491.8). Total num frames: 966656. Throughput: 0: 2962.2, 1: 3055.8. Samples: 746996. 
Policy #0 lag: (min: 10.0, avg: 36.1, max: 43.0) -[2023-10-17 13:28:37,239][125151] Avg episode reward: [(0, '5.020'), (1, '5.730')] -[2023-10-17 13:28:37,262][126004] Updated weights for policy 0, policy_version 1882 (0.0011) -[2023-10-17 13:28:38,121][126005] Updated weights for policy 1, policy_version 1930 (0.0007) -[2023-10-17 13:28:38,514][126005] Updated weights for policy 1, policy_version 1940 (0.0007) -[2023-10-17 13:28:38,903][126005] Updated weights for policy 1, policy_version 1950 (0.0007) -[2023-10-17 13:28:39,210][126004] Updated weights for policy 0, policy_version 1892 (0.0009) -[2023-10-17 13:28:39,599][126004] Updated weights for policy 0, policy_version 1902 (0.0007) -[2023-10-17 13:28:39,981][126004] Updated weights for policy 0, policy_version 1912 (0.0007) -[2023-10-17 13:28:40,811][126005] Updated weights for policy 1, policy_version 1960 (0.0007) -[2023-10-17 13:28:41,198][126005] Updated weights for policy 1, policy_version 1970 (0.0009) -[2023-10-17 13:28:41,585][126005] Updated weights for policy 1, policy_version 1980 (0.0007) -[2023-10-17 13:28:42,238][125151] Fps is (10 sec: 5734.3, 60 sec: 5870.9, 300 sec: 5530.3). Total num frames: 999424. Throughput: 0: 2931.6, 1: 3088.9. Samples: 782140. 
Policy #0 lag: (min: 31.0, avg: 42.1, max: 63.0) -[2023-10-17 13:28:42,239][125151] Avg episode reward: [(0, '5.210'), (1, '5.320')] -[2023-10-17 13:28:42,326][126004] Updated weights for policy 0, policy_version 1922 (0.0008) -[2023-10-17 13:28:42,704][126004] Updated weights for policy 0, policy_version 1932 (0.0008) -[2023-10-17 13:28:43,086][126004] Updated weights for policy 0, policy_version 1942 (0.0008) -[2023-10-17 13:28:43,132][126005] Updated weights for policy 1, policy_version 1990 (0.0011) -[2023-10-17 13:28:43,473][126004] Updated weights for policy 0, policy_version 1952 (0.0011) -[2023-10-17 13:28:43,510][126005] Updated weights for policy 1, policy_version 2000 (0.0010) -[2023-10-17 13:28:43,906][126005] Updated weights for policy 1, policy_version 2010 (0.0007) -[2023-10-17 13:28:45,166][126004] Updated weights for policy 0, policy_version 1962 (0.0012) -[2023-10-17 13:28:45,563][126004] Updated weights for policy 0, policy_version 1972 (0.0011) -[2023-10-17 13:28:45,707][126005] Updated weights for policy 1, policy_version 2020 (0.0007) -[2023-10-17 13:28:45,935][126004] Updated weights for policy 0, policy_version 1982 (0.0011) -[2023-10-17 13:28:46,076][126005] Updated weights for policy 1, policy_version 2030 (0.0007) -[2023-10-17 13:28:46,463][126005] Updated weights for policy 1, policy_version 2040 (0.0007) -[2023-10-17 13:28:47,238][125151] Fps is (10 sec: 6553.4, 60 sec: 6144.0, 300 sec: 5566.2). Total num frames: 1032192. Throughput: 0: 2934.4, 1: 3088.6. Samples: 800368. 
Policy #0 lag: (min: 5.0, avg: 24.5, max: 37.0) -[2023-10-17 13:28:47,239][125151] Avg episode reward: [(0, '5.530'), (1, '5.600')] -[2023-10-17 13:28:48,222][126004] Updated weights for policy 0, policy_version 1992 (0.0011) -[2023-10-17 13:28:48,230][126005] Updated weights for policy 1, policy_version 2050 (0.0008) -[2023-10-17 13:28:48,599][126004] Updated weights for policy 0, policy_version 2002 (0.0012) -[2023-10-17 13:28:48,611][126005] Updated weights for policy 1, policy_version 2060 (0.0011) -[2023-10-17 13:28:48,982][126004] Updated weights for policy 0, policy_version 2012 (0.0010) -[2023-10-17 13:28:48,998][126005] Updated weights for policy 1, policy_version 2070 (0.0011) -[2023-10-17 13:28:49,381][126005] Updated weights for policy 1, policy_version 2080 (0.0011) -[2023-10-17 13:28:50,916][126005] Updated weights for policy 1, policy_version 2090 (0.0012) -[2023-10-17 13:28:51,205][126004] Updated weights for policy 0, policy_version 2022 (0.0009) -[2023-10-17 13:28:51,289][126005] Updated weights for policy 1, policy_version 2100 (0.0011) -[2023-10-17 13:28:51,583][126004] Updated weights for policy 0, policy_version 2032 (0.0008) -[2023-10-17 13:28:51,670][126005] Updated weights for policy 1, policy_version 2110 (0.0011) -[2023-10-17 13:28:51,972][126004] Updated weights for policy 0, policy_version 2042 (0.0007) -[2023-10-17 13:28:52,238][125151] Fps is (10 sec: 6553.7, 60 sec: 6144.0, 300 sec: 5599.6). Total num frames: 1064960. Throughput: 0: 2922.0, 1: 3080.0. Samples: 836048. 
Policy #0 lag: (min: 30.0, avg: 52.1, max: 62.0) -[2023-10-17 13:28:52,239][125151] Avg episode reward: [(0, '5.250'), (1, '5.500')] -[2023-10-17 13:28:53,798][126005] Updated weights for policy 1, policy_version 2120 (0.0012) -[2023-10-17 13:28:53,837][126004] Updated weights for policy 0, policy_version 2052 (0.0009) -[2023-10-17 13:28:54,181][126005] Updated weights for policy 1, policy_version 2130 (0.0012) -[2023-10-17 13:28:54,226][126004] Updated weights for policy 0, policy_version 2062 (0.0010) -[2023-10-17 13:28:54,562][126005] Updated weights for policy 1, policy_version 2140 (0.0012) -[2023-10-17 13:28:54,601][126004] Updated weights for policy 0, policy_version 2072 (0.0011) -[2023-10-17 13:28:56,190][126004] Updated weights for policy 0, policy_version 2082 (0.0008) -[2023-10-17 13:28:56,242][126005] Updated weights for policy 1, policy_version 2150 (0.0009) -[2023-10-17 13:28:56,578][126004] Updated weights for policy 0, policy_version 2092 (0.0012) -[2023-10-17 13:28:56,622][126005] Updated weights for policy 1, policy_version 2160 (0.0008) -[2023-10-17 13:28:56,961][126004] Updated weights for policy 0, policy_version 2102 (0.0012) -[2023-10-17 13:28:57,010][126005] Updated weights for policy 1, policy_version 2170 (0.0007) -[2023-10-17 13:28:57,238][125151] Fps is (10 sec: 5734.5, 60 sec: 6007.5, 300 sec: 5577.2). Total num frames: 1089536. Throughput: 0: 2919.0, 1: 3090.9. Samples: 871396. 
Policy #0 lag: (min: 30.0, avg: 52.1, max: 62.0) -[2023-10-17 13:28:57,239][125151] Avg episode reward: [(0, '5.070'), (1, '4.770')] -[2023-10-17 13:28:57,348][126004] Updated weights for policy 0, policy_version 2112 (0.0012) -[2023-10-17 13:28:58,431][126005] Updated weights for policy 1, policy_version 2180 (0.0009) -[2023-10-17 13:28:58,811][126005] Updated weights for policy 1, policy_version 2190 (0.0012) -[2023-10-17 13:28:59,073][126004] Updated weights for policy 0, policy_version 2122 (0.0012) -[2023-10-17 13:28:59,191][126005] Updated weights for policy 1, policy_version 2200 (0.0012) -[2023-10-17 13:28:59,462][126004] Updated weights for policy 0, policy_version 2132 (0.0012) -[2023-10-17 13:28:59,832][126004] Updated weights for policy 0, policy_version 2142 (0.0011) -[2023-10-17 13:29:01,419][126005] Updated weights for policy 1, policy_version 2210 (0.0011) -[2023-10-17 13:29:01,763][126004] Updated weights for policy 0, policy_version 2152 (0.0011) -[2023-10-17 13:29:01,796][126005] Updated weights for policy 1, policy_version 2220 (0.0012) -[2023-10-17 13:29:02,145][126004] Updated weights for policy 0, policy_version 2162 (0.0011) -[2023-10-17 13:29:02,192][126005] Updated weights for policy 1, policy_version 2230 (0.0011) -[2023-10-17 13:29:02,238][125151] Fps is (10 sec: 4915.3, 60 sec: 5870.9, 300 sec: 5556.2). Total num frames: 1114112. Throughput: 0: 2938.9, 1: 3092.4. Samples: 890212. 
Policy #0 lag: (min: 4.0, avg: 22.1, max: 36.0) -[2023-10-17 13:29:02,239][125151] Avg episode reward: [(0, '4.830'), (1, '4.990')] -[2023-10-17 13:29:02,529][126004] Updated weights for policy 0, policy_version 2172 (0.0010) -[2023-10-17 13:29:02,560][126005] Updated weights for policy 1, policy_version 2240 (0.0011) -[2023-10-17 13:29:04,258][126004] Updated weights for policy 0, policy_version 2182 (0.0011) -[2023-10-17 13:29:04,645][126004] Updated weights for policy 0, policy_version 2192 (0.0012) -[2023-10-17 13:29:04,766][126005] Updated weights for policy 1, policy_version 2250 (0.0011) -[2023-10-17 13:29:05,027][126004] Updated weights for policy 0, policy_version 2202 (0.0011) -[2023-10-17 13:29:05,158][126005] Updated weights for policy 1, policy_version 2260 (0.0012) -[2023-10-17 13:29:05,543][126005] Updated weights for policy 1, policy_version 2270 (0.0012) -[2023-10-17 13:29:06,908][126004] Updated weights for policy 0, policy_version 2212 (0.0008) -[2023-10-17 13:29:07,238][125151] Fps is (10 sec: 5734.4, 60 sec: 6144.0, 300 sec: 5586.8). Total num frames: 1146880. Throughput: 0: 2986.7, 1: 3076.9. Samples: 927608. 
Policy #0 lag: (min: 31.0, avg: 47.6, max: 63.0) -[2023-10-17 13:29:07,239][125151] Avg episode reward: [(0, '5.820'), (1, '5.790')] -[2023-10-17 13:29:07,294][126004] Updated weights for policy 0, policy_version 2222 (0.0011) -[2023-10-17 13:29:07,409][126005] Updated weights for policy 1, policy_version 2280 (0.0008) -[2023-10-17 13:29:07,678][126004] Updated weights for policy 0, policy_version 2232 (0.0012) -[2023-10-17 13:29:07,787][126005] Updated weights for policy 1, policy_version 2290 (0.0011) -[2023-10-17 13:29:08,164][126005] Updated weights for policy 1, policy_version 2300 (0.0012) -[2023-10-17 13:29:09,564][126004] Updated weights for policy 0, policy_version 2242 (0.0011) -[2023-10-17 13:29:09,958][126004] Updated weights for policy 0, policy_version 2252 (0.0009) -[2023-10-17 13:29:10,089][126005] Updated weights for policy 1, policy_version 2310 (0.0011) -[2023-10-17 13:29:10,332][126004] Updated weights for policy 0, policy_version 2262 (0.0008) -[2023-10-17 13:29:10,468][126005] Updated weights for policy 1, policy_version 2320 (0.0011) -[2023-10-17 13:29:10,713][126004] Updated weights for policy 0, policy_version 2272 (0.0012) -[2023-10-17 13:29:10,861][126005] Updated weights for policy 1, policy_version 2330 (0.0011) -[2023-10-17 13:29:12,238][125151] Fps is (10 sec: 6553.4, 60 sec: 6144.0, 300 sec: 5615.6). Total num frames: 1179648. Throughput: 0: 3001.4, 1: 3058.0. Samples: 964308. 
Policy #0 lag: (min: 34.0, avg: 47.5, max: 72.0) -[2023-10-17 13:29:12,239][125151] Avg episode reward: [(0, '5.490'), (1, '5.830')] -[2023-10-17 13:29:12,379][126004] Updated weights for policy 0, policy_version 2282 (0.0011) -[2023-10-17 13:29:12,437][126005] Updated weights for policy 1, policy_version 2340 (0.0011) -[2023-10-17 13:29:12,761][126004] Updated weights for policy 0, policy_version 2292 (0.0011) -[2023-10-17 13:29:12,812][126005] Updated weights for policy 1, policy_version 2350 (0.0011) -[2023-10-17 13:29:13,149][126004] Updated weights for policy 0, policy_version 2302 (0.0012) -[2023-10-17 13:29:13,195][126005] Updated weights for policy 1, policy_version 2360 (0.0010) -[2023-10-17 13:29:15,044][126005] Updated weights for policy 1, policy_version 2370 (0.0012) -[2023-10-17 13:29:15,297][126004] Updated weights for policy 0, policy_version 2312 (0.0011) -[2023-10-17 13:29:15,428][126005] Updated weights for policy 1, policy_version 2380 (0.0011) -[2023-10-17 13:29:15,683][126004] Updated weights for policy 0, policy_version 2322 (0.0012) -[2023-10-17 13:29:15,812][126005] Updated weights for policy 1, policy_version 2390 (0.0012) -[2023-10-17 13:29:16,069][126004] Updated weights for policy 0, policy_version 2332 (0.0012) -[2023-10-17 13:29:16,194][126005] Updated weights for policy 1, policy_version 2400 (0.0010) -[2023-10-17 13:29:17,238][125151] Fps is (10 sec: 6553.6, 60 sec: 6144.0, 300 sec: 5642.8). Total num frames: 1212416. Throughput: 0: 2983.1, 1: 3064.8. Samples: 982336. 
Policy #0 lag: (min: 31.0, avg: 50.9, max: 64.0) -[2023-10-17 13:29:17,239][125151] Avg episode reward: [(0, '5.550'), (1, '5.630')] -[2023-10-17 13:29:18,302][126004] Updated weights for policy 0, policy_version 2342 (0.0012) -[2023-10-17 13:29:18,370][126005] Updated weights for policy 1, policy_version 2410 (0.0011) -[2023-10-17 13:29:18,680][126004] Updated weights for policy 0, policy_version 2352 (0.0012) -[2023-10-17 13:29:18,748][126005] Updated weights for policy 1, policy_version 2420 (0.0012) -[2023-10-17 13:29:19,065][126004] Updated weights for policy 0, policy_version 2362 (0.0012) -[2023-10-17 13:29:19,132][126005] Updated weights for policy 1, policy_version 2430 (0.0009) -[2023-10-17 13:29:20,515][126004] Updated weights for policy 0, policy_version 2372 (0.0012) -[2023-10-17 13:29:20,904][126004] Updated weights for policy 0, policy_version 2382 (0.0011) -[2023-10-17 13:29:21,282][126004] Updated weights for policy 0, policy_version 2392 (0.0007) -[2023-10-17 13:29:21,409][126005] Updated weights for policy 1, policy_version 2440 (0.0007) -[2023-10-17 13:29:21,800][126005] Updated weights for policy 1, policy_version 2450 (0.0008) -[2023-10-17 13:29:22,171][126005] Updated weights for policy 1, policy_version 2460 (0.0009) -[2023-10-17 13:29:22,238][125151] Fps is (10 sec: 5734.5, 60 sec: 6007.5, 300 sec: 5622.3). Total num frames: 1236992. Throughput: 0: 2975.3, 1: 3031.3. Samples: 1017292. Policy #0 lag: (min: 31.0, avg: 46.5, max: 68.0) -[2023-10-17 13:29:22,239][125151] Avg episode reward: [(0, '6.130'), (1, '5.420')] -[2023-10-17 13:29:22,240][125686] Saving new best policy, reward=6.130! 
-[2023-10-17 13:29:23,287][126004] Updated weights for policy 0, policy_version 2402 (0.0008) -[2023-10-17 13:29:23,681][126004] Updated weights for policy 0, policy_version 2412 (0.0007) -[2023-10-17 13:29:24,019][126005] Updated weights for policy 1, policy_version 2470 (0.0012) -[2023-10-17 13:29:24,061][126004] Updated weights for policy 0, policy_version 2422 (0.0007) -[2023-10-17 13:29:24,404][126005] Updated weights for policy 1, policy_version 2480 (0.0009) -[2023-10-17 13:29:24,450][126004] Updated weights for policy 0, policy_version 2432 (0.0010) -[2023-10-17 13:29:24,800][126005] Updated weights for policy 1, policy_version 2490 (0.0007) -[2023-10-17 13:29:26,172][126004] Updated weights for policy 0, policy_version 2442 (0.0007) -[2023-10-17 13:29:26,560][126004] Updated weights for policy 0, policy_version 2452 (0.0007) -[2023-10-17 13:29:26,697][126005] Updated weights for policy 1, policy_version 2500 (0.0009) -[2023-10-17 13:29:26,947][126004] Updated weights for policy 0, policy_version 2462 (0.0010) -[2023-10-17 13:29:27,076][126005] Updated weights for policy 1, policy_version 2510 (0.0011) -[2023-10-17 13:29:27,238][125151] Fps is (10 sec: 5734.4, 60 sec: 6007.5, 300 sec: 5647.8). Total num frames: 1269760. Throughput: 0: 3007.5, 1: 3010.5. Samples: 1052948. 
Policy #0 lag: (min: 31.0, avg: 47.0, max: 76.0) -[2023-10-17 13:29:27,239][125151] Avg episode reward: [(0, '5.350'), (1, '5.820')] -[2023-10-17 13:29:27,454][126005] Updated weights for policy 1, policy_version 2520 (0.0012) -[2023-10-17 13:29:28,659][126004] Updated weights for policy 0, policy_version 2472 (0.0008) -[2023-10-17 13:29:29,037][126004] Updated weights for policy 0, policy_version 2482 (0.0009) -[2023-10-17 13:29:29,156][126005] Updated weights for policy 1, policy_version 2530 (0.0012) -[2023-10-17 13:29:29,419][126004] Updated weights for policy 0, policy_version 2492 (0.0009) -[2023-10-17 13:29:29,546][126005] Updated weights for policy 1, policy_version 2540 (0.0011) -[2023-10-17 13:29:29,936][126005] Updated weights for policy 1, policy_version 2550 (0.0011) -[2023-10-17 13:29:30,318][126005] Updated weights for policy 1, policy_version 2560 (0.0012) -[2023-10-17 13:29:31,709][126004] Updated weights for policy 0, policy_version 2502 (0.0012) -[2023-10-17 13:29:32,082][126005] Updated weights for policy 1, policy_version 2570 (0.0012) -[2023-10-17 13:29:32,087][126004] Updated weights for policy 0, policy_version 2512 (0.0012) -[2023-10-17 13:29:32,238][125151] Fps is (10 sec: 5734.4, 60 sec: 5870.9, 300 sec: 5628.3). Total num frames: 1294336. Throughput: 0: 3008.3, 1: 3020.2. Samples: 1071648. 
Policy #0 lag: (min: 31.0, avg: 43.8, max: 63.0) -[2023-10-17 13:29:32,239][125151] Avg episode reward: [(0, '5.070'), (1, '4.800')] -[2023-10-17 13:29:32,465][126005] Updated weights for policy 1, policy_version 2580 (0.0010) -[2023-10-17 13:29:32,472][126004] Updated weights for policy 0, policy_version 2522 (0.0008) -[2023-10-17 13:29:32,847][126005] Updated weights for policy 1, policy_version 2590 (0.0011) -[2023-10-17 13:29:34,261][126004] Updated weights for policy 0, policy_version 2532 (0.0007) -[2023-10-17 13:29:34,658][126004] Updated weights for policy 0, policy_version 2542 (0.0007) -[2023-10-17 13:29:34,703][126005] Updated weights for policy 1, policy_version 2600 (0.0009) -[2023-10-17 13:29:35,051][126004] Updated weights for policy 0, policy_version 2552 (0.0007) -[2023-10-17 13:29:35,096][126005] Updated weights for policy 1, policy_version 2610 (0.0011) -[2023-10-17 13:29:35,468][126005] Updated weights for policy 1, policy_version 2620 (0.0007) -[2023-10-17 13:29:37,179][126004] Updated weights for policy 0, policy_version 2562 (0.0007) -[2023-10-17 13:29:37,238][125151] Fps is (10 sec: 5734.4, 60 sec: 6007.5, 300 sec: 5652.3). Total num frames: 1327104. Throughput: 0: 3027.0, 1: 2999.6. Samples: 1107244. 
Policy #0 lag: (min: 37.0, avg: 54.9, max: 58.0) -[2023-10-17 13:29:37,239][125151] Avg episode reward: [(0, '4.910'), (1, '5.870')] -[2023-10-17 13:29:37,566][126004] Updated weights for policy 0, policy_version 2572 (0.0007) -[2023-10-17 13:29:37,733][126005] Updated weights for policy 1, policy_version 2630 (0.0010) -[2023-10-17 13:29:37,954][126004] Updated weights for policy 0, policy_version 2582 (0.0007) -[2023-10-17 13:29:38,119][126005] Updated weights for policy 1, policy_version 2640 (0.0012) -[2023-10-17 13:29:38,336][126004] Updated weights for policy 0, policy_version 2592 (0.0007) -[2023-10-17 13:29:38,515][126005] Updated weights for policy 1, policy_version 2650 (0.0011) -[2023-10-17 13:29:40,519][126004] Updated weights for policy 0, policy_version 2602 (0.0012) -[2023-10-17 13:29:40,715][126005] Updated weights for policy 1, policy_version 2660 (0.0011) -[2023-10-17 13:29:40,902][126004] Updated weights for policy 0, policy_version 2612 (0.0008) -[2023-10-17 13:29:41,101][126005] Updated weights for policy 1, policy_version 2670 (0.0011) -[2023-10-17 13:29:41,296][126004] Updated weights for policy 0, policy_version 2622 (0.0007) -[2023-10-17 13:29:41,484][126005] Updated weights for policy 1, policy_version 2680 (0.0011) -[2023-10-17 13:29:42,238][125151] Fps is (10 sec: 6553.7, 60 sec: 6007.5, 300 sec: 5675.1). Total num frames: 1359872. Throughput: 0: 3030.1, 1: 2967.7. Samples: 1141300. 
Policy #0 lag: (min: 31.0, avg: 37.2, max: 63.0) -[2023-10-17 13:29:42,239][125151] Avg episode reward: [(0, '5.430'), (1, '4.940')] -[2023-10-17 13:29:42,903][126004] Updated weights for policy 0, policy_version 2632 (0.0011) -[2023-10-17 13:29:43,288][126004] Updated weights for policy 0, policy_version 2642 (0.0012) -[2023-10-17 13:29:43,654][126005] Updated weights for policy 1, policy_version 2690 (0.0012) -[2023-10-17 13:29:43,672][126004] Updated weights for policy 0, policy_version 2652 (0.0008) -[2023-10-17 13:29:44,042][126005] Updated weights for policy 1, policy_version 2700 (0.0012) -[2023-10-17 13:29:44,422][126005] Updated weights for policy 1, policy_version 2710 (0.0012) -[2023-10-17 13:29:44,818][126005] Updated weights for policy 1, policy_version 2720 (0.0012) -[2023-10-17 13:29:45,604][126004] Updated weights for policy 0, policy_version 2662 (0.0007) -[2023-10-17 13:29:45,991][126004] Updated weights for policy 0, policy_version 2672 (0.0007) -[2023-10-17 13:29:46,377][126004] Updated weights for policy 0, policy_version 2682 (0.0008) -[2023-10-17 13:29:46,526][126005] Updated weights for policy 1, policy_version 2730 (0.0011) -[2023-10-17 13:29:46,902][126005] Updated weights for policy 1, policy_version 2740 (0.0011) -[2023-10-17 13:29:47,238][125151] Fps is (10 sec: 5734.2, 60 sec: 5870.9, 300 sec: 5656.3). Total num frames: 1384448. Throughput: 0: 3012.3, 1: 2964.0. Samples: 1159148. 
Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) -[2023-10-17 13:29:47,239][125151] Avg episode reward: [(0, '4.780'), (1, '5.640')] -[2023-10-17 13:29:47,288][126005] Updated weights for policy 1, policy_version 2750 (0.0011) -[2023-10-17 13:29:48,588][126004] Updated weights for policy 0, policy_version 2692 (0.0008) -[2023-10-17 13:29:48,974][126004] Updated weights for policy 0, policy_version 2702 (0.0009) -[2023-10-17 13:29:49,293][126005] Updated weights for policy 1, policy_version 2760 (0.0010) -[2023-10-17 13:29:49,367][126004] Updated weights for policy 0, policy_version 2712 (0.0009) -[2023-10-17 13:29:49,674][126005] Updated weights for policy 1, policy_version 2770 (0.0011) -[2023-10-17 13:29:50,061][126005] Updated weights for policy 1, policy_version 2780 (0.0012) -[2023-10-17 13:29:50,925][126004] Updated weights for policy 0, policy_version 2722 (0.0011) -[2023-10-17 13:29:51,322][126004] Updated weights for policy 0, policy_version 2732 (0.0012) -[2023-10-17 13:29:51,639][126005] Updated weights for policy 1, policy_version 2790 (0.0012) -[2023-10-17 13:29:51,736][126004] Updated weights for policy 0, policy_version 2742 (0.0011) -[2023-10-17 13:29:52,029][126005] Updated weights for policy 1, policy_version 2800 (0.0012) -[2023-10-17 13:29:52,108][126004] Updated weights for policy 0, policy_version 2752 (0.0011) -[2023-10-17 13:29:52,238][125151] Fps is (10 sec: 5734.4, 60 sec: 5870.9, 300 sec: 5677.9). Total num frames: 1417216. Throughput: 0: 2970.0, 1: 2970.9. Samples: 1194948. 
Policy #0 lag: (min: 27.0, avg: 41.1, max: 61.0) -[2023-10-17 13:29:52,239][125151] Avg episode reward: [(0, '5.900'), (1, '5.330')] -[2023-10-17 13:29:52,405][126005] Updated weights for policy 1, policy_version 2810 (0.0012) -[2023-10-17 13:29:54,246][126005] Updated weights for policy 1, policy_version 2820 (0.0011) -[2023-10-17 13:29:54,265][126004] Updated weights for policy 0, policy_version 2762 (0.0010) -[2023-10-17 13:29:54,636][126005] Updated weights for policy 1, policy_version 2830 (0.0012) -[2023-10-17 13:29:54,640][126004] Updated weights for policy 0, policy_version 2772 (0.0009) -[2023-10-17 13:29:55,019][126004] Updated weights for policy 0, policy_version 2782 (0.0008) -[2023-10-17 13:29:55,026][126005] Updated weights for policy 1, policy_version 2840 (0.0010) -[2023-10-17 13:29:56,887][126004] Updated weights for policy 0, policy_version 2792 (0.0012) -[2023-10-17 13:29:57,238][125151] Fps is (10 sec: 5734.5, 60 sec: 5870.9, 300 sec: 5660.0). Total num frames: 1441792. Throughput: 0: 2939.0, 1: 2967.5. Samples: 1230100. 
Policy #0 lag: (min: 27.0, avg: 41.1, max: 61.0) -[2023-10-17 13:29:57,239][125151] Avg episode reward: [(0, '5.550'), (1, '5.240')] -[2023-10-17 13:29:57,278][126004] Updated weights for policy 0, policy_version 2802 (0.0011) -[2023-10-17 13:29:57,305][126005] Updated weights for policy 1, policy_version 2850 (0.0011) -[2023-10-17 13:29:57,665][126004] Updated weights for policy 0, policy_version 2812 (0.0011) -[2023-10-17 13:29:57,698][126005] Updated weights for policy 1, policy_version 2860 (0.0011) -[2023-10-17 13:29:58,078][126005] Updated weights for policy 1, policy_version 2870 (0.0011) -[2023-10-17 13:29:58,461][126005] Updated weights for policy 1, policy_version 2880 (0.0011) -[2023-10-17 13:29:59,992][126004] Updated weights for policy 0, policy_version 2822 (0.0010) -[2023-10-17 13:30:00,290][126005] Updated weights for policy 1, policy_version 2890 (0.0010) -[2023-10-17 13:30:00,375][126004] Updated weights for policy 0, policy_version 2832 (0.0011) -[2023-10-17 13:30:00,671][126005] Updated weights for policy 1, policy_version 2900 (0.0012) -[2023-10-17 13:30:00,761][126004] Updated weights for policy 0, policy_version 2842 (0.0010) -[2023-10-17 13:30:01,061][126005] Updated weights for policy 1, policy_version 2910 (0.0010) -[2023-10-17 13:30:02,238][125151] Fps is (10 sec: 5734.3, 60 sec: 6007.4, 300 sec: 5680.5). Total num frames: 1474560. Throughput: 0: 2920.7, 1: 2969.9. Samples: 1247416. 
Policy #0 lag: (min: 14.0, avg: 33.9, max: 53.0) -[2023-10-17 13:30:02,239][125151] Avg episode reward: [(0, '5.800'), (1, '5.550')] -[2023-10-17 13:30:02,627][126005] Updated weights for policy 1, policy_version 2920 (0.0011) -[2023-10-17 13:30:02,691][126004] Updated weights for policy 0, policy_version 2852 (0.0008) -[2023-10-17 13:30:03,015][126005] Updated weights for policy 1, policy_version 2930 (0.0012) -[2023-10-17 13:30:03,081][126004] Updated weights for policy 0, policy_version 2862 (0.0007) -[2023-10-17 13:30:03,417][126005] Updated weights for policy 1, policy_version 2940 (0.0012) -[2023-10-17 13:30:03,464][126004] Updated weights for policy 0, policy_version 2872 (0.0012) -[2023-10-17 13:30:05,055][126005] Updated weights for policy 1, policy_version 2950 (0.0009) -[2023-10-17 13:30:05,130][126004] Updated weights for policy 0, policy_version 2882 (0.0011) -[2023-10-17 13:30:05,443][126005] Updated weights for policy 1, policy_version 2960 (0.0011) -[2023-10-17 13:30:05,507][126004] Updated weights for policy 0, policy_version 2892 (0.0012) -[2023-10-17 13:30:05,832][126005] Updated weights for policy 1, policy_version 2970 (0.0011) -[2023-10-17 13:30:05,888][126004] Updated weights for policy 0, policy_version 2902 (0.0011) -[2023-10-17 13:30:06,276][126004] Updated weights for policy 0, policy_version 2912 (0.0012) -[2023-10-17 13:30:07,238][125151] Fps is (10 sec: 6553.4, 60 sec: 6007.4, 300 sec: 5700.1). Total num frames: 1507328. Throughput: 0: 2935.1, 1: 2975.3. Samples: 1283260. 
Policy #0 lag: (min: 4.0, avg: 19.3, max: 36.0) -[2023-10-17 13:30:07,240][125151] Avg episode reward: [(0, '5.130'), (1, '5.230')] -[2023-10-17 13:30:07,717][126005] Updated weights for policy 1, policy_version 2980 (0.0011) -[2023-10-17 13:30:08,098][126005] Updated weights for policy 1, policy_version 2990 (0.0011) -[2023-10-17 13:30:08,246][126004] Updated weights for policy 0, policy_version 2922 (0.0011) -[2023-10-17 13:30:08,475][126005] Updated weights for policy 1, policy_version 3000 (0.0010) -[2023-10-17 13:30:08,624][126004] Updated weights for policy 0, policy_version 2932 (0.0011) -[2023-10-17 13:30:09,031][126004] Updated weights for policy 0, policy_version 2942 (0.0012) -[2023-10-17 13:30:10,143][126005] Updated weights for policy 1, policy_version 3010 (0.0011) -[2023-10-17 13:30:10,534][126005] Updated weights for policy 1, policy_version 3020 (0.0010) -[2023-10-17 13:30:10,577][126004] Updated weights for policy 0, policy_version 2952 (0.0011) -[2023-10-17 13:30:10,906][126005] Updated weights for policy 1, policy_version 3030 (0.0009) -[2023-10-17 13:30:10,971][126004] Updated weights for policy 0, policy_version 2962 (0.0010) -[2023-10-17 13:30:11,287][126005] Updated weights for policy 1, policy_version 3040 (0.0009) -[2023-10-17 13:30:11,352][126004] Updated weights for policy 0, policy_version 2972 (0.0010) -[2023-10-17 13:30:12,238][125151] Fps is (10 sec: 6553.6, 60 sec: 6007.5, 300 sec: 5718.9). Total num frames: 1540096. Throughput: 0: 2931.2, 1: 2989.4. Samples: 1319376. Policy #0 lag: (min: 21.0, avg: 36.1, max: 53.0) -[2023-10-17 13:30:12,239][125151] Avg episode reward: [(0, '5.120'), (1, '5.280')] -[2023-10-17 13:30:12,250][125846] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000003040_778240.pth... -[2023-10-17 13:30:12,250][125686] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000002976_761856.pth... 
-[2023-10-17 13:30:12,287][125686] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000000448_114688.pth -[2023-10-17 13:30:12,297][125846] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000000480_122880.pth -[2023-10-17 13:30:13,310][126005] Updated weights for policy 1, policy_version 3050 (0.0011) -[2023-10-17 13:30:13,387][126004] Updated weights for policy 0, policy_version 2982 (0.0011) -[2023-10-17 13:30:13,697][126005] Updated weights for policy 1, policy_version 3060 (0.0008) -[2023-10-17 13:30:13,764][126004] Updated weights for policy 0, policy_version 2992 (0.0010) -[2023-10-17 13:30:14,084][126005] Updated weights for policy 1, policy_version 3070 (0.0009) -[2023-10-17 13:30:14,149][126004] Updated weights for policy 0, policy_version 3002 (0.0010) -[2023-10-17 13:30:15,797][126005] Updated weights for policy 1, policy_version 3080 (0.0008) -[2023-10-17 13:30:15,970][126004] Updated weights for policy 0, policy_version 3012 (0.0011) -[2023-10-17 13:30:16,178][126005] Updated weights for policy 1, policy_version 3090 (0.0008) -[2023-10-17 13:30:16,355][126004] Updated weights for policy 0, policy_version 3022 (0.0011) -[2023-10-17 13:30:16,565][126005] Updated weights for policy 1, policy_version 3100 (0.0007) -[2023-10-17 13:30:16,734][126004] Updated weights for policy 0, policy_version 3032 (0.0011) -[2023-10-17 13:30:17,238][125151] Fps is (10 sec: 6553.8, 60 sec: 6007.5, 300 sec: 5736.8). Total num frames: 1572864. Throughput: 0: 2932.2, 1: 2995.1. Samples: 1338376. 
Policy #0 lag: (min: 31.0, avg: 52.0, max: 83.0) -[2023-10-17 13:30:17,239][125151] Avg episode reward: [(0, '5.010'), (1, '5.300')] -[2023-10-17 13:30:18,479][126005] Updated weights for policy 1, policy_version 3110 (0.0011) -[2023-10-17 13:30:18,570][126004] Updated weights for policy 0, policy_version 3042 (0.0011) -[2023-10-17 13:30:18,861][126005] Updated weights for policy 1, policy_version 3120 (0.0011) -[2023-10-17 13:30:18,960][126004] Updated weights for policy 0, policy_version 3052 (0.0011) -[2023-10-17 13:30:19,249][126005] Updated weights for policy 1, policy_version 3130 (0.0011) -[2023-10-17 13:30:19,351][126004] Updated weights for policy 0, policy_version 3062 (0.0011) -[2023-10-17 13:30:19,748][126004] Updated weights for policy 0, policy_version 3072 (0.0011) -[2023-10-17 13:30:21,214][126005] Updated weights for policy 1, policy_version 3140 (0.0011) -[2023-10-17 13:30:21,478][126004] Updated weights for policy 0, policy_version 3082 (0.0009) -[2023-10-17 13:30:21,609][126005] Updated weights for policy 1, policy_version 3150 (0.0011) -[2023-10-17 13:30:21,874][126004] Updated weights for policy 0, policy_version 3092 (0.0008) -[2023-10-17 13:30:21,978][126005] Updated weights for policy 1, policy_version 3160 (0.0008) -[2023-10-17 13:30:22,238][125151] Fps is (10 sec: 4915.2, 60 sec: 5870.9, 300 sec: 5685.1). Total num frames: 1589248. Throughput: 0: 2962.0, 1: 3003.2. Samples: 1375680. 
Policy #0 lag: (min: 31.0, avg: 50.7, max: 93.0) -[2023-10-17 13:30:22,240][125151] Avg episode reward: [(0, '5.460'), (1, '4.860')] -[2023-10-17 13:30:22,264][126004] Updated weights for policy 0, policy_version 3102 (0.0007) -[2023-10-17 13:30:24,059][126005] Updated weights for policy 1, policy_version 3170 (0.0008) -[2023-10-17 13:30:24,120][126004] Updated weights for policy 0, policy_version 3112 (0.0011) -[2023-10-17 13:30:24,443][126005] Updated weights for policy 1, policy_version 3180 (0.0011) -[2023-10-17 13:30:24,507][126004] Updated weights for policy 0, policy_version 3122 (0.0012) -[2023-10-17 13:30:24,834][126005] Updated weights for policy 1, policy_version 3190 (0.0012) -[2023-10-17 13:30:24,905][126004] Updated weights for policy 0, policy_version 3132 (0.0008) -[2023-10-17 13:30:25,214][126005] Updated weights for policy 1, policy_version 3200 (0.0010) -[2023-10-17 13:30:26,746][126004] Updated weights for policy 0, policy_version 3142 (0.0010) -[2023-10-17 13:30:27,123][126005] Updated weights for policy 1, policy_version 3210 (0.0011) -[2023-10-17 13:30:27,126][126004] Updated weights for policy 0, policy_version 3152 (0.0011) -[2023-10-17 13:30:27,238][125151] Fps is (10 sec: 4915.3, 60 sec: 5870.9, 300 sec: 5703.0). Total num frames: 1622016. Throughput: 0: 2994.2, 1: 3020.0. Samples: 1411940. 
Policy #0 lag: (min: 31.0, avg: 43.2, max: 63.0) -[2023-10-17 13:30:27,239][125151] Avg episode reward: [(0, '5.780'), (1, '5.310')] -[2023-10-17 13:30:27,509][126005] Updated weights for policy 1, policy_version 3220 (0.0011) -[2023-10-17 13:30:27,513][126004] Updated weights for policy 0, policy_version 3162 (0.0012) -[2023-10-17 13:30:27,913][126005] Updated weights for policy 1, policy_version 3230 (0.0011) -[2023-10-17 13:30:29,433][126004] Updated weights for policy 0, policy_version 3172 (0.0011) -[2023-10-17 13:30:29,703][126005] Updated weights for policy 1, policy_version 3240 (0.0008) -[2023-10-17 13:30:29,827][126004] Updated weights for policy 0, policy_version 3182 (0.0012) -[2023-10-17 13:30:30,095][126005] Updated weights for policy 1, policy_version 3250 (0.0008) -[2023-10-17 13:30:30,213][126004] Updated weights for policy 0, policy_version 3192 (0.0010) -[2023-10-17 13:30:30,480][126005] Updated weights for policy 1, policy_version 3260 (0.0007) -[2023-10-17 13:30:32,036][126004] Updated weights for policy 0, policy_version 3202 (0.0007) -[2023-10-17 13:30:32,238][125151] Fps is (10 sec: 6553.7, 60 sec: 6007.5, 300 sec: 5720.1). Total num frames: 1654784. Throughput: 0: 2994.1, 1: 3011.3. Samples: 1429392. 
Policy #0 lag: (min: 15.0, avg: 26.9, max: 47.0) -[2023-10-17 13:30:32,239][125151] Avg episode reward: [(0, '5.260'), (1, '5.130')] -[2023-10-17 13:30:32,285][126005] Updated weights for policy 1, policy_version 3270 (0.0010) -[2023-10-17 13:30:32,420][126004] Updated weights for policy 0, policy_version 3212 (0.0007) -[2023-10-17 13:30:32,670][126005] Updated weights for policy 1, policy_version 3280 (0.0011) -[2023-10-17 13:30:32,801][126004] Updated weights for policy 0, policy_version 3222 (0.0007) -[2023-10-17 13:30:33,060][126005] Updated weights for policy 1, policy_version 3290 (0.0012) -[2023-10-17 13:30:33,189][126004] Updated weights for policy 0, policy_version 3232 (0.0010) -[2023-10-17 13:30:34,872][126004] Updated weights for policy 0, policy_version 3242 (0.0009) -[2023-10-17 13:30:35,225][126005] Updated weights for policy 1, policy_version 3300 (0.0011) -[2023-10-17 13:30:35,264][126004] Updated weights for policy 0, policy_version 3252 (0.0008) -[2023-10-17 13:30:35,593][126005] Updated weights for policy 1, policy_version 3310 (0.0012) -[2023-10-17 13:30:35,662][126004] Updated weights for policy 0, policy_version 3262 (0.0011) -[2023-10-17 13:30:35,976][126005] Updated weights for policy 1, policy_version 3320 (0.0012) -[2023-10-17 13:30:37,238][125151] Fps is (10 sec: 6553.6, 60 sec: 6007.5, 300 sec: 5736.6). Total num frames: 1687552. Throughput: 0: 2989.2, 1: 2983.0. Samples: 1463700. 
Policy #0 lag: (min: 19.0, avg: 38.4, max: 53.0) -[2023-10-17 13:30:37,239][125151] Avg episode reward: [(0, '5.690'), (1, '4.990')] -[2023-10-17 13:30:37,831][126004] Updated weights for policy 0, policy_version 3272 (0.0007) -[2023-10-17 13:30:37,838][126005] Updated weights for policy 1, policy_version 3330 (0.0011) -[2023-10-17 13:30:38,206][126004] Updated weights for policy 0, policy_version 3282 (0.0008) -[2023-10-17 13:30:38,221][126005] Updated weights for policy 1, policy_version 3340 (0.0007) -[2023-10-17 13:30:38,606][126004] Updated weights for policy 0, policy_version 3292 (0.0007) -[2023-10-17 13:30:38,610][126005] Updated weights for policy 1, policy_version 3350 (0.0007) -[2023-10-17 13:30:38,986][126005] Updated weights for policy 1, policy_version 3360 (0.0008) -[2023-10-17 13:30:40,508][126004] Updated weights for policy 0, policy_version 3302 (0.0008) -[2023-10-17 13:30:40,893][126004] Updated weights for policy 0, policy_version 3312 (0.0007) -[2023-10-17 13:30:41,264][126005] Updated weights for policy 1, policy_version 3370 (0.0008) -[2023-10-17 13:30:41,284][126004] Updated weights for policy 0, policy_version 3322 (0.0007) -[2023-10-17 13:30:41,638][126005] Updated weights for policy 1, policy_version 3380 (0.0010) -[2023-10-17 13:30:42,017][126005] Updated weights for policy 1, policy_version 3390 (0.0012) -[2023-10-17 13:30:42,238][125151] Fps is (10 sec: 6553.6, 60 sec: 6007.5, 300 sec: 5752.5). Total num frames: 1720320. Throughput: 0: 2989.5, 1: 2966.7. Samples: 1498128. Policy #0 lag: (min: 45.0, avg: 52.6, max: 80.0) -[2023-10-17 13:30:42,239][125151] Avg episode reward: [(0, '6.150'), (1, '5.800')] -[2023-10-17 13:30:42,250][125686] Saving new best policy, reward=6.150! 
-[2023-10-17 13:30:43,493][126004] Updated weights for policy 0, policy_version 3332 (0.0009) -[2023-10-17 13:30:43,722][126005] Updated weights for policy 1, policy_version 3400 (0.0009) -[2023-10-17 13:30:43,868][126004] Updated weights for policy 0, policy_version 3342 (0.0010) -[2023-10-17 13:30:44,115][126005] Updated weights for policy 1, policy_version 3410 (0.0011) -[2023-10-17 13:30:44,256][126004] Updated weights for policy 0, policy_version 3352 (0.0007) -[2023-10-17 13:30:44,489][126005] Updated weights for policy 1, policy_version 3420 (0.0011) -[2023-10-17 13:30:46,060][126005] Updated weights for policy 1, policy_version 3430 (0.0011) -[2023-10-17 13:30:46,260][126004] Updated weights for policy 0, policy_version 3362 (0.0009) -[2023-10-17 13:30:46,450][126005] Updated weights for policy 1, policy_version 3440 (0.0009) -[2023-10-17 13:30:46,644][126004] Updated weights for policy 0, policy_version 3372 (0.0011) -[2023-10-17 13:30:46,831][126005] Updated weights for policy 1, policy_version 3450 (0.0009) -[2023-10-17 13:30:47,028][126004] Updated weights for policy 0, policy_version 3382 (0.0011) -[2023-10-17 13:30:47,238][125151] Fps is (10 sec: 5734.3, 60 sec: 6007.5, 300 sec: 5736.5). Total num frames: 1744896. Throughput: 0: 3013.7, 1: 2960.6. Samples: 1516260. 
Policy #0 lag: (min: 45.0, avg: 52.6, max: 80.0) -[2023-10-17 13:30:47,239][125151] Avg episode reward: [(0, '5.630'), (1, '4.970')] -[2023-10-17 13:30:47,417][126004] Updated weights for policy 0, policy_version 3392 (0.0011) -[2023-10-17 13:30:48,705][126005] Updated weights for policy 1, policy_version 3460 (0.0009) -[2023-10-17 13:30:49,097][126005] Updated weights for policy 1, policy_version 3470 (0.0009) -[2023-10-17 13:30:49,486][126005] Updated weights for policy 1, policy_version 3480 (0.0007) -[2023-10-17 13:30:49,638][126004] Updated weights for policy 0, policy_version 3402 (0.0007) -[2023-10-17 13:30:50,015][126004] Updated weights for policy 0, policy_version 3412 (0.0007) -[2023-10-17 13:30:50,412][126004] Updated weights for policy 0, policy_version 3422 (0.0007) -[2023-10-17 13:30:51,112][126005] Updated weights for policy 1, policy_version 3490 (0.0007) -[2023-10-17 13:30:51,490][126005] Updated weights for policy 1, policy_version 3500 (0.0007) -[2023-10-17 13:30:51,892][126005] Updated weights for policy 1, policy_version 3510 (0.0007) -[2023-10-17 13:30:52,238][125151] Fps is (10 sec: 4915.2, 60 sec: 5870.9, 300 sec: 5721.2). Total num frames: 1769472. Throughput: 0: 2980.3, 1: 2997.7. Samples: 1552268. 
Policy #0 lag: (min: 3.0, avg: 29.8, max: 56.0) -[2023-10-17 13:30:52,239][125151] Avg episode reward: [(0, '5.850'), (1, '5.520')] -[2023-10-17 13:30:52,275][126005] Updated weights for policy 1, policy_version 3520 (0.0007) -[2023-10-17 13:30:52,654][126004] Updated weights for policy 0, policy_version 3432 (0.0011) -[2023-10-17 13:30:53,038][126004] Updated weights for policy 0, policy_version 3442 (0.0010) -[2023-10-17 13:30:53,419][126004] Updated weights for policy 0, policy_version 3452 (0.0012) -[2023-10-17 13:30:54,606][126005] Updated weights for policy 1, policy_version 3530 (0.0007) -[2023-10-17 13:30:54,990][126005] Updated weights for policy 1, policy_version 3540 (0.0007) -[2023-10-17 13:30:55,178][126004] Updated weights for policy 0, policy_version 3462 (0.0011) -[2023-10-17 13:30:55,366][126005] Updated weights for policy 1, policy_version 3550 (0.0007) -[2023-10-17 13:30:55,567][126004] Updated weights for policy 0, policy_version 3472 (0.0011) -[2023-10-17 13:30:55,971][126004] Updated weights for policy 0, policy_version 3482 (0.0012) -[2023-10-17 13:30:57,238][125151] Fps is (10 sec: 5734.5, 60 sec: 6007.5, 300 sec: 5736.4). Total num frames: 1802240. Throughput: 0: 2982.2, 1: 2993.7. Samples: 1588292. 
Policy #0 lag: (min: 35.0, avg: 61.4, max: 83.0) -[2023-10-17 13:30:57,238][125151] Avg episode reward: [(0, '5.610'), (1, '5.480')] -[2023-10-17 13:30:57,444][126005] Updated weights for policy 1, policy_version 3560 (0.0009) -[2023-10-17 13:30:57,457][126004] Updated weights for policy 0, policy_version 3492 (0.0010) -[2023-10-17 13:30:57,827][126005] Updated weights for policy 1, policy_version 3570 (0.0010) -[2023-10-17 13:30:57,850][126004] Updated weights for policy 0, policy_version 3502 (0.0011) -[2023-10-17 13:30:58,213][126005] Updated weights for policy 1, policy_version 3580 (0.0012) -[2023-10-17 13:30:58,228][126004] Updated weights for policy 0, policy_version 3512 (0.0011) -[2023-10-17 13:30:59,836][126005] Updated weights for policy 1, policy_version 3590 (0.0012) -[2023-10-17 13:30:59,924][126004] Updated weights for policy 0, policy_version 3522 (0.0011) -[2023-10-17 13:31:00,227][126005] Updated weights for policy 1, policy_version 3600 (0.0011) -[2023-10-17 13:31:00,313][126004] Updated weights for policy 0, policy_version 3532 (0.0011) -[2023-10-17 13:31:00,615][126005] Updated weights for policy 1, policy_version 3610 (0.0007) -[2023-10-17 13:31:00,700][126004] Updated weights for policy 0, policy_version 3542 (0.0011) -[2023-10-17 13:31:01,086][126004] Updated weights for policy 0, policy_version 3552 (0.0011) -[2023-10-17 13:31:02,238][125151] Fps is (10 sec: 6553.5, 60 sec: 6007.5, 300 sec: 5751.2). Total num frames: 1835008. Throughput: 0: 2979.6, 1: 2976.1. Samples: 1606380. 
Policy #0 lag: (min: 5.0, avg: 30.7, max: 47.0) -[2023-10-17 13:31:02,239][125151] Avg episode reward: [(0, '5.220'), (1, '5.820')] -[2023-10-17 13:31:02,388][126005] Updated weights for policy 1, policy_version 3620 (0.0011) -[2023-10-17 13:31:02,643][126004] Updated weights for policy 0, policy_version 3562 (0.0009) -[2023-10-17 13:31:02,768][126005] Updated weights for policy 1, policy_version 3630 (0.0011) -[2023-10-17 13:31:03,032][126004] Updated weights for policy 0, policy_version 3572 (0.0007) -[2023-10-17 13:31:03,158][126005] Updated weights for policy 1, policy_version 3640 (0.0011) -[2023-10-17 13:31:03,413][126004] Updated weights for policy 0, policy_version 3582 (0.0007) -[2023-10-17 13:31:03,747][125151] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 125151], exiting... -[2023-10-17 13:31:03,748][125151] Runner profile tree view: -main_loop: 286.9511 -[2023-10-17 13:31:03,749][125151] Collected {0: 917504, 1: 933888}, FPS: 5624.0 -[2023-10-17 13:31:03,749][125846] Stopping Batcher_1... -[2023-10-17 13:31:03,749][125686] Stopping Batcher_0... -[2023-10-17 13:31:03,749][125846] Loop batcher_evt_loop terminating... -[2023-10-17 13:31:03,750][125686] Loop batcher_evt_loop terminating... -[2023-10-17 13:31:03,750][125846] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000003648_933888.pth... -[2023-10-17 13:31:03,751][125686] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000003584_917504.pth... -[2023-10-17 13:31:03,754][126037] Stopping RolloutWorker_w0... -[2023-10-17 13:31:03,754][126037] Loop rollout_proc0_evt_loop terminating... -[2023-10-17 13:31:03,757][126043] Stopping RolloutWorker_w2... -[2023-10-17 13:31:03,757][126043] Loop rollout_proc2_evt_loop terminating... -[2023-10-17 13:31:03,758][126044] Stopping RolloutWorker_w6... -[2023-10-17 13:31:03,758][126637] Stopping RolloutWorker_w14... -[2023-10-17 13:31:03,758][126041] Stopping RolloutWorker_w4... 
-[2023-10-17 13:31:03,758][126041] Loop rollout_proc4_evt_loop terminating... -[2023-10-17 13:31:03,758][126044] Loop rollout_proc6_evt_loop terminating... -[2023-10-17 13:31:03,758][126637] Loop rollout_proc14_evt_loop terminating... -[2023-10-17 13:31:03,758][126045] Stopping RolloutWorker_w7... -[2023-10-17 13:31:03,758][126047] Stopping RolloutWorker_w10... -[2023-10-17 13:31:03,758][126050] Stopping RolloutWorker_w13... -[2023-10-17 13:31:03,758][126042] Stopping RolloutWorker_w5... -[2023-10-17 13:31:03,759][126047] Loop rollout_proc10_evt_loop terminating... -[2023-10-17 13:31:03,759][126045] Loop rollout_proc7_evt_loop terminating... -[2023-10-17 13:31:03,759][126042] Loop rollout_proc5_evt_loop terminating... -[2023-10-17 13:31:03,759][126050] Loop rollout_proc13_evt_loop terminating... -[2023-10-17 13:31:03,759][126051] Stopping RolloutWorker_w12... -[2023-10-17 13:31:03,759][126051] Loop rollout_proc12_evt_loop terminating... -[2023-10-17 13:31:03,759][126048] Stopping RolloutWorker_w9... -[2023-10-17 13:31:03,760][126048] Loop rollout_proc9_evt_loop terminating... -[2023-10-17 13:31:03,760][126039] Stopping RolloutWorker_w1... -[2023-10-17 13:31:03,761][126039] Loop rollout_proc1_evt_loop terminating... -[2023-10-17 13:31:03,762][126046] Stopping RolloutWorker_w8... -[2023-10-17 13:31:03,762][126046] Loop rollout_proc8_evt_loop terminating... -[2023-10-17 13:31:03,762][126049] Stopping RolloutWorker_w11... -[2023-10-17 13:31:03,762][126049] Loop rollout_proc11_evt_loop terminating... -[2023-10-17 13:31:03,764][126669] Stopping RolloutWorker_w15... -[2023-10-17 13:31:03,765][126040] Stopping RolloutWorker_w3... -[2023-10-17 13:31:03,765][126669] Loop rollout_proc15_evt_loop terminating... -[2023-10-17 13:31:03,765][126040] Loop rollout_proc3_evt_loop terminating... -[2023-10-17 13:31:03,767][126004] Weights refcount: 2 0 -[2023-10-17 13:31:03,768][126004] Stopping InferenceWorker_p0-w0... 
-[2023-10-17 13:31:03,768][126004] Loop inference_proc0-0_evt_loop terminating... -[2023-10-17 13:31:03,774][126005] Weights refcount: 2 0 -[2023-10-17 13:31:03,776][126005] Stopping InferenceWorker_p1-w0... -[2023-10-17 13:31:03,777][126005] Loop inference_proc1-0_evt_loop terminating... -[2023-10-17 13:31:03,798][125686] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000001600_409600.pth -[2023-10-17 13:31:03,799][125846] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000001632_417792.pth -[2023-10-17 13:31:03,804][125686] Stopping LearnerWorker_p0... -[2023-10-17 13:31:03,804][125686] Loop learner_proc0_evt_loop terminating... -[2023-10-17 13:31:03,805][125846] Stopping LearnerWorker_p1... -[2023-10-17 13:31:03,806][125846] Loop learner_proc1_evt_loop terminating... +version https://git-lfs.github.com/spec/v1 +oid sha256:5dc3031718e8d564eaa29cface6e4eae56eddedab674e3b68501219b05360837 +size 27940874