diff --git a/al_0.6_g_0.97_id_11_seed_970611/action_probs.tar.gz b/al_0.6_g_0.97_id_11_seed_970611/action_probs.tar.gz new file mode 100644 index 0000000000000000000000000000000000000000..c8c8617aaf341b7bd347be042454456e82a90aa5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/action_probs.tar.gz @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c049396988b744bfb1838ce6843ba872b767651bd00740eef158995fde231b88 +size 24751900 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints.tar.gz b/al_0.6_g_0.97_id_11_seed_970611/checkpoints.tar.gz new file mode 100644 index 0000000000000000000000000000000000000000..4d3c5e3d3b7360e786b0bc4e43ca69a6cddaa39e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints.tar.gz @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e78c2843757dd176a71117c42a1b1f406ad6b7e7a0e2d0027a7fdfa6684c2c +size 622706515 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00000.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00000.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2fa7be7a2594bcc023a8545fb9b5454d92f897a8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00000.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a47c68c363a6480b36a8e283a1c17a77e1aec3d70dc5faa24de54f3c2a95d2b4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00001.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00001.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8e2be0b7f8278b6f6e1b25c9b7fa9445a071e8f8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00001.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a1b212133708e466eff15365f99b7dad1ad5fb965c04134aff7aa355886ca56 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00002.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..61a8054d9875b6a1df9b7413b254c6af4eda35db --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adc073aabaa28b3700a9b5c8c6542cd0e98ac863d6bdfd0ef175ba5a84ec27e9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00003.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00003.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4b54700f479f61c4bfec0803002eef4e111cf211 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00003.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77b527df0450f2c3ec9654a3b5ae6a360206b0d6c36e0147d6ec336987684e49 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00004.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53accafbd06b9b851394fcac97d33868353c1832 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aa3d6b8a9dd5f066871618c3b9c5320a2410ffdc256872695978005cc0a0156 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00005.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00005.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..748d1f67b3ba6d3b2b6adca77359b2f98ad08a82 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00005.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9797722437f47127144ce08255d018680fa9ee4e69261e30b94a90c5a824dda4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00006.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00006.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c99b010685f04f34062cbef0742be3e0891c36ba --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00006.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f823538b6069e4041fa3c4f79c2112e92bbcfc67fcd7c65e59bcc91dc6ad6a7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00007.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00007.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3563b1d0aa809e9b00d39fce28480a01ad6145e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f71f7debd54a8ec8c64eacc1d37c1027dc6d3f412812f7327a06b2163d7bf62 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00008.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00008.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..139bbc5c122509c3cedfaa998df7b69eed11230a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00008.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca812c6055ea386eb602db31cd94664f14f65110ba9d2b8debd8b06e11855f09 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00009.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00009.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..744a695b5ab28b13888b9e4b8380f31f2811b826 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00009.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b866b22df1546beeccf6e2cc1fc18bbb92492ebf31642885b2d2481f80c628b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00010.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00010.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd3913c0f3d1a13dd6c00e6121db8afddf3668c3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00010.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27fb75d0255de779aa2ab94de70e2cf4521418d716e28d77aedcc7538cec5a8b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00011.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00011.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..57a4fb2d22bb986cba893de0a024f8948c4ba90f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00011.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d316cc61d0a01582c2be6917fc8d47692e8bf7f2f0705e139d2b95759a07469 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00012.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00012.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9cf642a5a10aa158b29290b32b4a4271c21ba78d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00012.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fddaedb7fdc0d7895941b8433b6b5230340dd7b7990b63bd3f4fc4af561909e2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00013.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00013.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2d361a48bbfec9ae111b1f56db6a5238a4ab21a4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00013.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaea0b9b54cc74389cac7ba27abead058f30a0fc417c523be77acfd432717a97 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00014.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00014.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0682ad0449c0adeded4cacc4578b7667e0bbe32a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00014.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:797e03cd20d10cc210d9589abb4f4114366108f05246b36a869bf787887ca899 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00015.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00015.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ecbe21760f71b037e7f38d04f4d986347d7d453e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00015.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:967e9151ab80eb4df1bed014a1288a1e71baecd90b93227ed759a882c14f9789 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00016.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00016.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e53f91185e97f3782336450dc7836bfa8c051b91 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00016.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d35ad59fdb1b9611e6af0a8d6ef5f7f88460975e25dffee8f69d496b1039416 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00017.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00017.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..36815d85e1f52ac6b57139ae051cefbbf47280a9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00017.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:816d8cd02a289588c2c82033a93507281b781b0775c58861222429c1a6bd9461 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00018.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00018.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fe460ebc46c5a7702e857fd89e2ab9abd8f2eda3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00018.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a72de9b2cb6fb5dfc9183accf74dcab93fffc6b6a6ac0b9265475566717f72c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00019.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00019.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4983972e9a7542acc6b8da40c64490c8444468e5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00019.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62bbe66dde307211eb6585e6464e926acf99406c82aae13c01367d200445fbd8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00020.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00020.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..513963ef35ddf95d1f75d20205c3e105ddcb0fea --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00020.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513f29e73b85217a9a28651205a20ab0efd59b5aec71bee8c8bb66fd613dec44 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00021.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00021.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..97d5a95d467f23641b47a401f962bd47deb21283 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00021.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27141ea01b4558a3c634e1508fa704e3e1b3cec7a93a07aba61a0320e2e3f424 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00022.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00022.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e91ac1fd8842119c5769432fd36334ad8f15cc10 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00022.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10a0c99cec87ffe005ad135950fca6110d9d515fefb89ac4f6c211782fd6c5ea +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00023.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00023.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03df1df4aef28872ca19c9ca18b09116bed7a48d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00023.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0135dd468730501eb58be678296ae70a7980d23ae98ec1b9b37f1ac83346949d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00024.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00024.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5bca709f908aed4a332ee26be298ebe84d40926f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00024.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6efa08c786ac3966b6fb84db14c188640adb202a3548c58d8d6c9bfa602dc2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00025.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00025.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd82b4f167df9dc9f25c8bb85084f5bf2d0daf8e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00025.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f916ce1342ea472b6c716bae4f07841ee53748163de85d8beb53ed3a4d3be150 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00026.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00026.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..18cb6a171f118c5f0d60df6002df6496be4b1184 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00026.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ff9c6b0cf15bd119c89f2bd5a7aa9fb36f6ae9c8dcb4b0209421e453a619c47 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00027.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00027.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d1a53cbc608da8de0bc4df1c3af81e145365e893 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00027.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24204415be86ff77f94d67ba345100ac64efc4b85cb283f4de4cc8a35acd53ca +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00028.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00028.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..19cda38ee9dee3cd3943aab2dda6052799c27bd1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00028.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2dadabe6227b9d94777f3870e4ff4d8b6251688a351abb5d371f4ce240f76e0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00029.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00029.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bcf3d71b8cd6397598800d2e002293c8143a090d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00029.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6bb61ba8866645754b5865602a2a03487a2608945af6d25ff81d77590ac002 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00030.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00030.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3c06a6ee0f16ca2b60611922573c9b3a5979b062 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00030.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62bfcabbd59a02df6538168c770f79bb3b9222592a0075812c3b46750215f281 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00031.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00031.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..38b64ea54ab9c3e25c824b582dbcf4ccc8acc296 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00031.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f7c43508bc3c2ef6175424e44a7c6aa999c5a793379f1b11395ca3b0cd3ca7b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00032.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00032.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..389cb2ffb285aecef9be303c433e1bdbddf54dc4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00032.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e96a50d5174511b20351e0eed08f0aaa24372a731b3f174120f069c41055f930 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00033.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00033.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ff12e6be24bc07764c2f31fe2105972a03c5dbf9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00033.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c9460dd4b8dc792651b2c0c0a6998b53488bc9aa260eb5246a2a0cea56d4cf3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00034.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00034.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..99f04731b5506bbd8ed293bfc194140f171f8149 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00034.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:190c7524bab6287091c83fed59d25d82f0b2dd0658e4386215b422cd677908d1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00035.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00035.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cddefeaf6d17c198701a114a9156e66c3aa27a38 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00035.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa4d376815e248d9c36df62c34bbc6028f24b5055f1f428a8c626701f749d6b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00036.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00036.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c80d227ddc0cfe0131070fea7e2b3011981e6740 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00036.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d1cd8e21e20fcc7f6603e8711652bfc7be93058fd7bf09a9b43bef01a7cd4a5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00037.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00037.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5ada0dda22bad9111c29b3c548f5e42ec7f0c41a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00037.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0981b646a88187712f77a3ff754fc76f80d2029d1e216e8629ffa172b007b23 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00038.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00038.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..59d5470723b5df6107bcd06cc97b20a34a4b414c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00038.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba0b8ded20c341b51d5f76ee043a7a94cb32eff5e3369e84a8ba68151540284c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00039.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00039.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d7bc1830c753fb5eae61928304cf4a65c889a75c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00039.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd4213af1821f9c3019ff114d3ca493968fd442fb107ac4ccf67b726850ba4e4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00040.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00040.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2145df9d6c10537cbd665516ded4ccca0f7760fa --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00040.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb4531700a938689ffa3993cff77515ba5cab361ab3a8044355dae53cf1f06e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00041.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00041.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..243f06310f8aed243902a68325840342dbed9bbf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00041.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b10391c40f4e0c09491b7b39bfd39408d0c8ef17de3a14d75974a24ec517e9b8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00042.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00042.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..06951f0dec84853dea767f24f380382584e330da --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00042.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eb229bfe79ff7415044561ad06c4fd0dd520d8248c7273a941d3a83d73d0dc0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00043.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00043.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7c05cc903e2dbc3b9203ecd964831c4e151690c9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00043.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f51b33387399d772017038d1d2080ac984959696e2557bbd7a4d86ffc01d6a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00044.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00044.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df685b1e5b8b2473818e2a1bd43ab0babc48e354 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00044.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bf0b9befd7d710484393b49ef6ef0fefbf23721e3270cd9e7e2180c5b931060 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00045.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00045.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6c7f3438745b9efe882731f351a75685422d941b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00045.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2cf770b75914123c1c63fb3c41808dcbe99a0e8b4e09ffac93826e898f2d56b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00046.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00046.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eed272bd4aeb7cfdf540023fd14a9f05465ea0f2 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00046.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0cfccc37a7ed35d3f63274e0b6cc9b78afa187d5064f73e00888f0714dbf70d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00047.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a89320f4c260201d1ec8f1e59e293fc963aee1f8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:779e41cc480da07f33155121473c9978f95f1883d1e9700f68f23ceb9b98d51d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00048.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00048.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9bdb85ee9d8f917d4ff47b6c37745fca139dda6d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00048.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:302368f8ed054e4c5bc79115a522a783911412929a11f72612d20b30a246b7f5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00049.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00049.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fd35be602fa7f09a652e3683a2cc928188a6dd10 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00049.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0527a0eb38fada9f3ba1f700119ebb4df1b9fddae60df3a95414be7b907aa9f1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00050.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00050.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0b3669ab4451c0edd69381fcb12a0d1e25bbd85b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00050.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8edbedacd4ca5f519b2399bff90bb8aac60d10847e1689c899647f23f583144e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00051.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00051.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb4e5c47474a23e0e4e92781db0804b52e87972e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00051.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c78abddac40acf7fdfb08252c159ed42eca9bc06b1e5cda3013593f86483ff6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00052.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00052.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1db3a3f460dd65a5a1539fa72802f2423fa676a0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00052.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3435bb10a40891686ea76e92769c26788b8f68103bdf83560b24bc6fe71c81ec +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00053.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00053.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9867959369ba73248c56076db63b530f7fd70a66 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00053.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f25acef6d5bca07fce2cf6bfa99e6632b46a7aaac9e91f1d91e7ce30aadd2214 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00054.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00054.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bcd7cb2613d667b1361701ed61b5253aae38ce41 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00054.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b30607812281e78569678c4fdc2638e1be29b2f8f013d921754da1cb4957bcd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00055.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00055.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9b39ee818cfd5f7371b7198a4e391384c9a5fa4d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00055.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:572074b314126f18218885becda94c7f451426c26b93e9026f505d88f6546af3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00056.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00056.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eb65ef1f146a6894fed81fb6606a78ed4c8e8911 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00056.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13bb3f2c65a7b05670afdda6eae5c62e2556d6cef73b2d7ff67f8b476c148d29 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00057.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00057.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f9815730bc53d4b8c8ab8828f9cc3956e27c8058 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00057.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a222726c94b32b7650e9d173963c1bc2fe920d122fedad37cca8c3e1dedde2ea +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00058.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00058.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..95d008e9bda35b95c6c8696b8b8af4a9496087ec --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00058.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:051b8b9de964a35ce7626a497ef8a60686332a7d1d755b6fea5a836bab636ea7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00059.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00059.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f259542c3df4176980b467cb0886ab5bb7ff4413 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00059.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e28bcbfe5e0bf08348c9bc3bc8840de0ecf6fb7daafb77176bb2c3d5f069b9e6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00060.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00060.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5880a726bd7bbcda94ac99149f7dac933d4edc71 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00060.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7895f62b251f69922e1058962d249f6f8f065c83a3173516a2cd1e8ea59df8df +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00061.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00061.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d04ab58d08574b353e63f00545442cfb4259c27 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00061.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:530d20aecb2d583c8ab0d17ae73475054ca7d9124c26770bbc8aa4df0fc03432 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00062.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00062.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc43f084886d168b34434ac4b8d99e7a3ead6b17 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00062.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e5bf2e7da9c3ca052961981fd62ad48e1550ba6193d29518dddf18d7f8ecd7d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00063.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00063.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f45aa05101cfa489786f56acd914e5544f2e5cf3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00063.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:871ba118714015ca852b380a627b43b5b84ec317da3a06097d02ece0a06788fe +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00064.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00064.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..494e667287fa4db466e661d9f38ef400305936da --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00064.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b68bb7785e44eb1c72681539c7382420a3f8e339ee0f84f674a31603da27a5c4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00065.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00065.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..954609c63c1400b87c24c5bd3751edae437955fd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00065.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31eeec4cfb19762f9669e6f9b7353ebc1096b70d1b5383722ba4ee6ba6cf8827 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00066.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00066.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..291ee488716056c5cd20e62f33481b421050ff2d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00066.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:751e300def5c2c02d296a5c83bbf110b6d14aa354c7debd1d5497324816482d6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00067.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00067.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..74d6b74a51a6b662721e3bfaa119d640be00cbdd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00067.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971c8677300f3306ced5b2573d18ca4feea36cebbe3c06631994fb8567424e09 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00068.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00068.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..82ece8ac83601238d7d17129e6764be83fcc013f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00068.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769275707d11fc1260029c2b6b9efbb1ad7c0e7e283c1be7b6bd6e2cb4ea6c64 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00069.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00069.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0d7dd6a5868835b44336815ddabe399942cea968 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00069.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b628ac3ff89f4a84aca0cb8eaa660f34795c14fb94a0eeafc620314a4bf4885a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00070.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00070.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb4be55d1587822876edcd7a2315aaceff9790bf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00070.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eec14b040c4f977bbc1f915caa80d844d1b7260a9a76ee59cd80d284cd7f5974 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00071.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..014840cbe1bf827c92ef64f5f33bb650dd55c5be --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:447d2cf6916d70678c9ecce0feec4b1a2e39abc1c437907e9c57e5b4b4f5225b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00072.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..061818dcfedbf967dd6f70fc5d94f8ffecc42c47 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7e32f13ede6533b4ca3ddbcc9e18e149432ac9651d54a64361587363cb5f04f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00073.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00073.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7bf936bc0d74d5f0a557e44f0eff91ec6de1c3bb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00073.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02a06731faced19aa519c2897bbaa049b2da9f1d92b135144fc921c9c72b652e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00074.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00074.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ee6fadf6c88a48663f79a073eed788c02efa92a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00074.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b2fdc6f9ad5076d6262952948e864d60da0a1f6165732af42438532248af38 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00075.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00075.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..950940ce9b16a1308c20e4906addc4da20d6f1cb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00075.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc6afdf14ebfe949e74a70407b86da6f8411c78442816c740bebcdf71111b84 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00076.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00076.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4130c5fc8ced36ed04984be7b27c114c7176b72d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00076.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6255b46a77e2f714a9587d979018b5a286605cf99ca312d79e7b824291ec69b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00077.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00077.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0cc5725415857c175f5eb336c27ff336301e840 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00077.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:901675e1008eccce10b819538b27ba4a02d908c9b85058db21ab757ddb1e23ef +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00078.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00078.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad78ef9bc1d7656518857036698c575e67d5b20b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00078.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a71303fd77d67443642a11d997b55cc6230101b9fd42819a4bffed79c55888a9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00079.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00079.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4b8f88245d9fff4c3f93850484da61735496c3c2 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00079.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ba57e8920ba49aa05fae984f19798b8cdde5834033e09d02ccc42633bc7eabb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00080.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00080.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ac07fd9f14a11239d1b126a7a9079f8d5c9b540 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00080.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c4001d487c66bf845ff9af3aeebe15ba5e261bfcbc0d630883321cbaa2ee659 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00081.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00081.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..770587688b7453f9d94c6dce174263966c2d0ee7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00081.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e90db27c9533bdb2e127d17a76648c5e95bf903107900f579bea27c2c5c69c1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00082.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00082.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e6d3f27fd8d441ecb7e6f150f4adccaf23f85745 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00082.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b34b18e22e71c2486fcfb9ef681b0cb87852f7da6514cf724b048ff234d99d9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00083.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00083.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..66511780921afab08acb337dfde1ee20fbe8345e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00083.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3ca0698c31569b4e410244076ef2d4c89eb071deaa44bd22a8f3e284331aaed +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00084.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00084.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4e9cb11169ecc4879b7e30badd0545e6386d9d06 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00084.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6dcebc632179bf3160451d36c00d4dce1909c24856ffd37b05bbae3b8fa4632 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00085.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00085.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f46d9f4d77385a67e31693574a8eae5d1662f623 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00085.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0404220003bdb0d752940b16803cae38be55dd321d1aa345fe5ab4577860d406 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00086.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00086.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a1725e3d0972d75bc6029eaa14c0106839571a34 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00086.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29ee3e5e46cc68ee04e8d5a3f56e52bad79afe453c6514e29297e10b5b7e9b25 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00087.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00087.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aa6be905ee30aad93919cbc5a8b529ca446a3c22 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00087.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631e0e1e1fedd271bfbae88104202f1d5851a02a80b5c4fab13609b6542f5759 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00088.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00088.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8f55eafdbe99b495be31444d9e16e57b9b2bad1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00088.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be68655732fe5d354dd3df29c275bb44713af5634d1a2f265705124766337295 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00089.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00089.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a6b09e078da0369c6858a337dd9329e7d908feed --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00089.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3283e3c8585520afb8f8bd9bf7f7689496d5704279dc76671b05ef732397761 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00090.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00090.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dcf241afc842de915b19dc908dd8239292f3ca96 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00090.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8648c205d4409ea09bd82cf42ab7f0357c9fe9227c2b94a462be942ff55b2975 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00091.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00091.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..54bf5567ee640611ecf2a50c5661de8d363a5c60 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00091.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:831ec9ebd6b5c501d6f97608df21c1efdd0030d315beed6d3ac7bff716449433 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00092.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..81ee95de10aa4cb2cf830ad8e756520812d401d5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87328eeac8ec28da1681f6d46f2ed557cb930bde51f8915d4d02c77602a5edb8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00093.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00093.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..153858286d321ee10c5fc20b1c84b807d1e76d16 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00093.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e19e69cf0877a043c425c8407a308eadb53c11b1bace3700feb4491ee84eab92 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00094.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00094.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37df3567bbbfd1a318efeb52e62ece20ed6c8666 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00094.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a91d8a40cbb2ded90c76cecfc52444627afdcd578764dc8247bed2078855a56 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00095.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00095.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3edffc86a0067797df91217c11c408a67ded6cc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00095.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29bfad8cacdd568c226395092ff54fa46ac1e4e5495877b85099fd2bc2511577 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00096.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00096.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3efc17b6da17e50ceadae1bb1647560bc8f460d7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00096.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02fb03b08df9cf83855f4aab7e2d8d1bbea757cc8863e2baabf619a27bb27973 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00097.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00097.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..65757e59262317982de1ba76852ea226cb2aa128 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00097.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbd9778fc085fadb9f976e25ef28544e0d1b4d769b14d32b8e3edccbf58df996 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00098.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00098.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fd3b79d9529693f4766675c29ae9b42b4295e488 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00098.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ca03bfff5ed1f17807ed887bdc954835480ca03a7ddb85396b6fda6902b0af5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00099.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00099.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..532d34d6fd6f604c42030b7b6d11823097c3f7c6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00099.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68cc41341e44c01906148cc2f277bcab0b4aee2040543cee3ccc91ceb74f47a8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00100.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00100.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c6e8641772bda40f5e23d98512a52d7dbea9484 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00100.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49472c496b443cda637f04d13d0f5714256a2f1414ddd1838b57803fa1e92c5f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00101.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00101.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ad6f2d2e54e6338912bb3f5a259aa58c8f7dbd9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00101.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e7a49bf8c281842d7db9c935994abe3cc73673a863e464b2deccfca12f23ff9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00102.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00102.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..93219e766366cc6e3d3e3a7235dcac3e7863dbd9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00102.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f8cd6d26901ce891be8efe08c2b86ce31f4c6974b47037067a2018b335f732e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00103.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00103.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2dc496876493e7e989fcae885d227a709429827d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00103.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae09a612388494f5f66e795e41d54ed41d4112d2655e0be9e7990ae0e7427223 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00104.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00104.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..055d7a2741f437bc377eadb6f854f66c5dad941f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00104.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86fc70a94a5b34fd83944d40cf99e1023fc2a87a94aa8a06f401673f5c591fe3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00105.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00105.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7de4aa3a904a2a1d4c9954f06eadb3774dc6f996 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00105.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5128de093e863c7c34c33cca7a5bc004b8837ebcd42686a83311f56ec14f27bd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00106.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00106.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3bf60e2bff112193002e2ac50a382f7f0829722 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00106.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e378a7e02b02eb6326b407f68297dd433961dc050ba3c7cf6bb200545f756b38 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00107.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00107.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d79bd5d293e02bc2a28bb080368f9d95310f885e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00107.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a977ed64f8366537a8be5580e29cceb5aeec0ca57150a61b7c70b6fc5c9da5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00108.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00108.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8329a795086c70cb0b94115cb6bcdeda77af379a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00108.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba31dc4d00fe507202b9b03d68f070c8bb9d45ce4f58b12054ff5aa38a231093 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00109.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00109.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a12302c7a5637522c264997d6708c69cc53b1b61 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00109.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64a94561d47cfc0c7ad23e898ae719823c5300edff3b8f25d5bdbde2263468ef +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00110.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00110.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..02c982cfafa333dbd28622f1d4e6c5bb8720e927 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00110.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b5708ace83dc3b9fc2a6feb9292682fc3a0df6aea236428addb24174033764 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00111.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00111.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3c9f4472474744248301e7746c0130612c1860f4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00111.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1364c9b855eb24283ee5631cd1cb2fc42d425046d9d4cb564073aea02172270 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00112.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00112.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..435843ba5415c82af25768120597d84027d9ad0a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00112.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a87509aca617169959cdcfba89cc9b4fc8cb45895d3a1a9afe69be28c5e415bb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00113.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00113.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c3d7dcd6a5b6c7690e098c5def1ccae225f51b71 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00113.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:156b6aee9c5c01ca9f3c33a43c26af1603432a961aec78f22750163d3a8b46bf +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00114.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00114.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f75100e62d1d0db587201d0c2d7ca446348ea80 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00114.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ca8d15e5a398e60a91228b89032592856dcf0e95c1b64307cb8b4423ab29af1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00115.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00115.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..750c7d115ddb3b30a3eb4febd2434bb58b0f33ec --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00115.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6785dfc1331e4df56442f91d996184b73ffb1d39e128f88dbea48893291a9326 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00116.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00116.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..84a8707b8a13ed252baf0344a2802438dc1305c1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00116.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:597e9decfef482972c7ddd300920f66c44722a2296f1adaf25aee82e6239ceb0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00117.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00117.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f30e35ea85ee11b8b538e6927172ce65d060087a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00117.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bddc15301366e26ed071fecff0cb9a0e475ea81dee7bec3365b88cb49967895 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00118.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00118.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4abf9876d50acec94fb83d45af1f892fdc00a09a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00118.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7521763d65ed94d2609f1dcfe69e9dded3c9cf749f3cac7f680e4349f9a342 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00119.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00119.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ffb2976ff9d1acef7030bbdb3bef5c96b639b9cc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00119.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71cbd4cea86dbe859709c1391097eeca0f46fd08c91390aca9d184ec6a569a81 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00120.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00120.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1b618a6e77b0bde3c21b21c0c0fc9cd24a587446 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00120.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6baa42bf5b008479fad9c1460a36be8ddad09063af3bb3bb5626673cb036fee2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00121.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00121.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..61c8df1be67e747956f75fa1006b00611c7c3391 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00121.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4008f821b27389101021c4c2efec23ac783bc3d523e4b51948a06ccbe2c74318 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00122.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00122.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..67b6ed50d8e70aa30670cf38c95ee73f4b10d8de --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00122.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:819edb766850a2dc421023bf36b935bc6f2dd9b6207f911a9cf87a7ef285ad0d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00123.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00123.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..20a7ef4a5548fb9eeb5ae02a04622edc3ebbedd3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00123.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e6b11994aa7ead24d56bc41a380b3f2d5ebc391a365a0d13c05fb915478624a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00124.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00124.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..67d352db277a8d909b7d2af832d2b2bf376025f4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00124.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc5fcc36e747edcf6eefdb69fea2443ecf21b5b0b5838b7682b01765c3d78e7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00125.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00125.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fe29069d654df7ab7a25d8bc575f8d497a1a2e00 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00125.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4963f62fb0a7e034094b9bfe6b6652eb949676419208ae7cf0db274b36339cf +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00126.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00126.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0fc1b8fa2224d051a6cac5c30d78a80ca9aa0253 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00126.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e45bdb292cd6e49cb92b05e45a42ae017e1354dc27bde16c9a29e2781c1ceff9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00127.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00127.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..04fb6fba804759fcfa9620ff51a8564a8677d6ff --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00127.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:668ca67b0596aa77a126b62ad83aa1efcb914d5166d37f9ebc07b09a882cf69a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00128.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00128.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b9d8ca2229bc15d3b85a1cd4ad39b921329dc99c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00128.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fdb1cadc0df38db1cdb10dd18755a65793c8cd305f1f04f19b0d9cffe034e82 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00129.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00129.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a6d95cb5201768508c617cd905644194b85279af --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00129.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea455fe4aa6ca5ee4851df235ef79b6c346dfe63fab53fcba8917397808a09c0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00130.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00130.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..07cfe836142eabdee61ab096a2e901a9efa3f552 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00130.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fba03c9460481ec9b87306bcb4cb75d4f61004ffd071935f57cb176b71f73909 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00131.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00131.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1ea25e70c94a7ee08a0c3bc85728f01ef6c438b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00131.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b019406208085bcb4b1b23521c9f16e59a6e4d7a2d9ccba7b7b514f7254acc5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00132.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1e8db9b7dbe22334cc49927c30083c58c65ac971 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae20d8b6fa4b60cfdf93487ba10a7511df4a7a1cc346744b1c0531f3699466fb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00133.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00133.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c8029e32d7d7bf3c060bbb17367318b14da7c8c5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00133.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db717d6d2c90fcc4f886ba6f3826bc7ba8b8631b8a414fe900a02ecf8d87b7ff +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00134.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00134.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..953f6d1621004a81594ebd8b81dc41eb1199391d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00134.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd314d3ffa77e7ed327f76b435eca69d210b706fb86dd4d4710b60df09996273 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00135.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00135.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd06b3e0e4ab27407a72aeea714f82a682566d37 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00135.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16289ce455ea409a2cd901837886a1eb66a2afb0ef6f99b7f2080c35e4eb170b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00136.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00136.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..10cce60a904b45c72a2a7db844909fd690aacf4a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00136.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ec3feb9e9cacfe90ae5ed3e97e76a14b735dc96e72009a52e5760db2f19a958 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00137.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00137.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f837464edbc031cafb69c18b59cb2bcfab9c97d0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00137.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8b1e1efdf7e8140fffbc6fe90a3c7941cfada85d18e8e91f1f6e7f62e6aa11f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00138.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00138.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c8b2105e035470ba60f78948a31d39f8d1236135 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00138.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f15cb231872c76f1707547c97afcfb0221fa3ab9fe08804770129afbc7fcf9d7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00139.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00139.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a15f27955a250b159440187c965061951a01bc27 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00139.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16cfa98b77b9e5342cdcd1a50cd49a147c138e5258f64a32007d68439eda9dc6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00140.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00140.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4ee6a1a3646f9b04bf4ed8fd9c3b0fa0e53770f4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00140.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c82106fcead28ef7d3f5af113c26cb5fdb7cc8908384e1013324e455c8035a46 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00141.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00141.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f9d1ef8bd56ced96660a109c8773a679b3ccf8dd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00141.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77193c9d336f8e51f6081aedb5b63233132033fcef7b90ff5ca657a3273c69f1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00142.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..edbbe810d528f39697238a769975d58094bec875 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f4415d05871ad50702d961207ab5dfeb65cbb048e83797984ca8389662149ea +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00143.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00143.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3ce33ead95f3980cc5036988cfe109b09bd4a855 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00143.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59bf9409e4733fcaaf1e68a64a6b054febd919fe47b1dfe344b073f7ce3a020d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00144.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00144.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5d3309a5c3ae9e94c994454386a1826705c20135 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00144.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ce97648c199cccc03581700db83f5a9789431f106c4a50bd1e2a65e1068e1d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00145.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00145.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a8018bcfb95de69c7c00e0cd3e0da6b5060e15f7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00145.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0baf6cbeb721460b46dd3ecaa50e004f7fe4309ca35ccb97bc06171ac33c1343 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00146.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00146.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e271b195782db3bebc6f5f8abe187826187608dd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00146.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33bc4c934e6e83f39d63c0d15a9a08f01a6059f815202702bfcefac14a5ea87e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00147.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00147.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f59f1ca84730e57751b1dd7b27fcfd65767233b6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00147.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb9d4fdb5ee48e5f343036885176e5c0230f18d70c7d0ba6893e87211a41915 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00148.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00148.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2f5c1c08d0ccc1cc1b2cd2cc168f66cc145915c3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00148.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeb40f63fc44d096cd35c44747509ead0f59cdb97f2afa436bfbfad0998651a3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00149.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00149.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..26f4debc056128b05cc1aa9ae97f321530515d51 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00149.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bcb123541c91be84b979f0237242eb3267c1a6b6008c029d62bb41caafa3e46 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00150.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00150.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fef38dd199ccef272712168e5f8f7301833866bf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00150.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d1378e178ee8ee39385793b40dedc4bebe1c46b8102b3456bbb9c7a6fb8244f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00151.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00151.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..56aacc86b3587987b67c52c13d12d89e620425da --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00151.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d158f144e098e87578c98dd74e5d8616e2eccdc4b147fa5e02afb27e7625ac +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00152.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00152.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..945a2515f944c8dd8d0f7d3901b46e8bf2d24549 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00152.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6b4ba9bd7b8ae8fa35c26384fe497296d885f8e4b82727ef8b27ff8316dfc3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00153.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00153.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b59a1cc8e859b0622d000489cb2b9bc8df7b767e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00153.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90453ddc0b35204936f3e4a4bc21c6b5c2d45c8449f626a09d7c39c86332bb9b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00154.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00154.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dfee062c6e894c65332c7c88ffb78665d4dbfe84 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00154.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c65b12fafe2bd52cbb5f38b49c660d8d662fd8c5d80b936ac82a18b1fdfebd80 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00155.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00155.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..108cf907f2f083874b95038254e18b8fd3707aeb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00155.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:562e7fa028ae8ad8b3f9bc88b7211de354eb1eb816a21b718b1a15433042ec8a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00156.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00156.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..055889093e1e8f3162dbe264284a4223926ca523 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00156.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94b8669ef733b9b1c5144ac6b5a827c4bbed9aed3c164bbd80570b55cf8a537e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00157.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00157.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7d252d55b1ac658a5400deb42ab40f74f2f38903 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00157.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e24b9f82d6332c3e99f06b5efbd6442e08d51614f164907e456010fee52d01c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00158.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00158.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7bd3a9f0d8c2a552d460f65ff3c86ff39cd76c93 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00158.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29b101ffe4bcd586fbef8cb0ef893e66d8991cdb252ea27884ed68661da00099 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00159.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00159.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..beb38ca0bfad820716bbc7185d15d6a3df0b7c65 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00159.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b3058eb92233bc046d2311be266b635d1e1daf39da866a73f4b9c7f33156cf2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00160.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00160.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a770bc877a96d1e48b81648be799507911dea057 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00160.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd321fefc201796810a5a707eab0371610c360aabba358b8b33bbbf01a6aaa7a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00161.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00161.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1caaa9048b313aeb95685b65babb0031fea48bd0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00161.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59b387e14cd13bd7b9587f47bf0391d58cd5cfd644304e33be0acc50c1731624 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00162.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00162.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ed34013b92e11a65d196ed268dd3ad5eb04d19ca --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00162.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdc90feaff0751a22d0216bbbe13da3bd52f4c134e1ffa04e5c4b20dee8c5d84 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00163.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f928cba4140053d0e6e9347a010319a5d4771f3c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dedddd413da2fe45ef52c836c77cb8a48ae9c35231fd86be97ece87d1ff680d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00164.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00164.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a272ee4ee4c80e5a5e7b5a5920c2e0f165cf4db6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00164.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e29961b7981630089d891fc6a4eb8c5cf400707863e94f9f42cd66eb5e7e2209 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00165.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00165.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e7d490d5086effe8102b1fdc5c862b6b151a9c34 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00165.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04745f45e2cadcaa11acd66c06afe8a6392393c13f9eede80a247a376367cbf9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00166.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00166.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..814bf30de0d3375692c754662ff56f09700b094f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00166.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb3433efa16dd73861e0c1e3f33446d66e1492d64f15d748c04bab7df6dd52e4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00167.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00167.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fe9149027e46b15f12d6df5b120249c42cd560fa --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00167.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee0da45abbefd8c2feb4c70bd4a7beb94827dd4a91494595e80bb016eabdfc7b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00168.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00168.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..547cecb4986e2525c257a1d5ba1bff68c8f4e44d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00168.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0da9f0a5dc52f3f03d0b009e83f00d8f9ec1e575393df59f9eba38b2c3b3005 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00169.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00169.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0f19b2d492dd3d0abbde6aba7ccee43b4e9ebf01 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00169.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bcdf004b01ed1e285432484040e32f4bbf5d66fa6dda4407ec333eb539e177e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00170.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00170.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8b4419bfc5fec415651c9110a65b9f59b6b6e465 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00170.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80650f4f8388f7e96ba66564a54f1566f86bbf1965858f96e900e9bcb12fb4dc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00171.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1f44fb719ef9657c177e5abce686c4c4f53bcbe1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c7ec8c0759ad27c3f5ef2250079808752576ee77ec09b948e51c0e4b45fe78 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00172.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00172.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2be8560911b5ff279a624d764501407b41f377ee --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00172.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3e12c72dcd9a615e636496c6acf103146277950f3bac12e1b90140b9dca6c79 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00173.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00173.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2fc12ca34558b6c6d4c66813cd5dfdc0099f027 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00173.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d0f1cfc7fbb4a2e3ce3e72ceb61f53cb1d9976efb3e8899571bc5c82e5782f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00174.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00174.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8fd1fc99fd4ea29d811f239f7f86a1614fdd8e5e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00174.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9637e332791fa4898706503600fba6049eecd8ca4b7b753cc24b21b33321b767 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00175.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00175.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..055bec89b3871601982bd2fd64180125f210dc78 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00175.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77047ca3336b87f279bdd6cfcd1ad76c7d2949a582538b584b0b9355a6b95069 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00176.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00176.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b4055011eeb070a223a0d13d902201451c4e7efb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00176.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f266469bdb8ad2b598897f5f1a24d5a2f6d69e109fb275c7c0716a287f7ecf2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00177.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00177.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..299dabaaf954759ff6ea7c9eebe2868e9595b6b7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00177.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc4b5e2d013e655d84e828f22cd6f6c70699ebf5e56ef1a46e8389740f07514f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00178.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00178.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9cc1e16233099a5d98170746c7d126e093746454 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00178.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ba2c30b953b06b0c9456554967c5011973e3e3b7bb415f50b0114f5f561d69 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00179.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00179.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..146eb56d8d0a692a1af62d5982fac9420440ba37 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00179.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c87676966786e536278c4ff700165beb941b87352e21b67d21fa1c061343189b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00180.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00180.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5ad190fb013ae8c8f3629779f742466f28b5c8c5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00180.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74bfd12636a3d47f5f395b11fdeffbd82749abd8cd8e50015fc450a54620ba8f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00181.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00181.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69a0d1e25ef30b07efcf52801a891db8cc97ba36 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00181.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4ecb3b3e6a67a44fe2a7fa1a486b53446553fe183f697934da1acd8a6aa8b75 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00182.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00182.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bc7445f9f68d0d38693430584ed94bda3b590b58 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00182.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89acfe30869c49fab8e01e1a509e5e54ab2d5f4d1687fd14f8767a63ceb932d6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00183.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00183.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..78420d145fd46e791234f7964b8b13715584f02b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00183.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:418632d42a313184a5027ceae95bc8d54b922d5f77400a094c84b2c298343f30 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00184.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00184.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..16e840973f9f25174a35acbbf1a7042164b9c882 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00184.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed613f5f02b14a8fe6efe7f778d1af5138b3285f195dc53c489d06b77fdea050 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00185.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00185.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a5addc31c5025fb2a56ecafe91ac2284b40c106f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00185.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa17f4b8d7da4c1c186eaf4e441e238c00c89ab90fafbb697121863a4284cc0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00186.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00186.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0364895a685eda384bed392e91988abdf11ab1b5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00186.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72050cac9c7d0d6f177b18cc8424c7159ea2e7facc6d307a1e23c5a44226329d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00187.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00187.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ae477464b2faec86e249953eb03b2ff0cecf0d0a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00187.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20446140740a4dd33686d9462c6cd8f58334071dfb0334a34faf4e44806a0e4f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00188.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00188.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3627cd6d43e3560a09ab081dbb61acf35d86490 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00188.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c34757ec7b8f42c05079133c335144d6027e3acde7761d29dd193533e620e893 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00189.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00189.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0f9011840ef66cc3795f5f1f36eef44864853c4c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00189.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a24ab02806b1f2b966180e212ce501f407f2152730a5090f7a50b8f06844fc08 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00190.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00190.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb4245a4ae5fe54321a848b280b583b1f6c1ba6c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00190.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3fd8a78d3d8f1ee3fae8537642935881ce4e9553edce2ee322af9513a84437d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00191.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f56b990750e7b5ae1f0330801df12a9188dd224c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db6b1f85dff9a31bcc505b73eac9f5201922c96e70061271d4f898e7962b7ed6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00192.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00192.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c4eb5bf1430812d3fb2d78fd55ec9bb0ece8834f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00192.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb50bc52c8b5a8bb7be3b0dbdc16e28f025c9ddcf21fd31b76216a3f964365e6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00193.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00193.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2f8765c794857474169dcbc107416ffc25c457c1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00193.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f36602acf62b46a2c9f9ac410615e9d3e734756c50f42b27ddbdffe42a46e921 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00194.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00194.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7b30342b32d81dd515a03099ceb3c973823eebf1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00194.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a865b1278278cb1dafe3dc409c0e0bc99fbc138c03cfbdf76f6739203cd62bb0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00195.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00195.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c131a3e6230ea10a2f8e91b6664c51a9b94143ec --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00195.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1784590b37dfdbced32f1ee91f62a7ac518a7540891acf8933c2d042e0dba280 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00196.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00196.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..08584b4e0e085a64196fa048fc3777981d68e91b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00196.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ccea1fa30e9acba9bba153df504a42aa8da136b864049b3f8d1b987c03def33 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00197.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00197.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7ca265fb08698cbe446eeb9ea82fc6a56890e216 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00197.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bafd7d2c155ea03c13005d1df0df4b689b3ea00221ff2d4dda09fbc95665c1dc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00198.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00198.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..72e35bc66e847a49f8f2b6dd21f6e2829465c9b5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00198.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d4237675fc40250581f995b14fc159cae0964410ff5ec8af6d6fa1491ef010 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00199.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00199.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1712692cbb57e18217de0c0a34666b3f89af44b5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00199.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04f113073f665923cfad41e9731c5d89ccd2fe5cc8f19d9fcfab998b6c8206ff +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00200.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00200.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5bafe15f97a5253bd2b17bb1d26ef8e79ec8c139 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00200.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303b874dfe890ca68dd9e60ec788c05fee4f16fdce4c92e9a221c6cae8afa292 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00201.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00201.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a0ae896cd34b541798b2d1799a66f759ddffcd6e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00201.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:905329e37dba5d72233e42fcd16513df0e0e31b48f54ed0b483d749eec646973 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00202.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00202.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a31fda9c1b4a0a2aa11717dc3747f8c7eb24b4a7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00202.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5e79ab189c258e9bdd9309f1384a591bd0806817e05b53f1a1ffc9b5e904504 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00203.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00203.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8199662093ccf07aeab146bf9b90ae6b51307b2d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00203.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:688c7251780ba54f8643bc75ecea2be56ac3724a68754ca1d6429c0923b767d4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00204.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00204.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fa2cb315867d1983f1b533079790e91f5ee1bdcc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00204.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc6bc6f45ef661e447a58661043ed393d514644e75520c4838057ea04c67c46e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00205.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00205.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f13418bbe86f263ab7626a803e1ad2e72ae86807 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00205.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e98be14007adcc9044a74cf0b744d0cf52338fa8e7489013657afaf0cb176a2a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00206.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00206.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a94ab8be859f0de84ed76c13a85a411673ffa05 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00206.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2310a8a420f45b0888b1f915b7013de7b4386ff05a7bb0f5b771e281c2604fc2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00207.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00207.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..84979c414a275528e660b70700bc3ac4c0a716cf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00207.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:570e75f77e901354c7d03bbab5df6ca4f0d575aee46d12fdf9d8b338f3193b9e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00208.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00208.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1c554794f72208217073767e86ed55a5467083ef --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00208.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1d9f22f2c9c600a019808dc216ed54ed25a0d6054229640f69a3a6ad2a03700 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00209.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00209.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3aa87330271981d6cbcc9734014193f51e8ecd40 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00209.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76efb467c01ad2b0e8b7d8e4914b6c9ef104a0c8b247cc09b63893df1a44a098 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00210.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00210.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..daf7f137b5918854ddb5b40699c551ef45c7a485 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00210.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a86e3cf92f675d8641cc2a8c2ee5ceba05260545e0b6ca8f596a954e0249308 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00211.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00211.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e433ea8e6f8114e53f36c5636d2c602929098c72 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00211.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbde3d9721bc24949eb4866786615eb1dad9a942b7928ed23d0f6ed044c0fa88 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00212.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00212.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c2f8bbf96d121e4ad58d57a6bc4c9927d1dc638a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00212.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b5c0656659ecf79336f0688579ab5343cc75546ff0f9c859009be6887701e50 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00213.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..08ddd26d6dbed47eb6af59817921ba380ea8e760 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:446fb039550f3023ee949f5c061e923046c33ae388ae8d8e31a9376bfd7b5c3d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00214.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00214.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4473179ab958a6d8baedbd1cc0715a4d7b17aa4c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00214.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01e049059b38e32f0d07b5c9e7ccfcb536e80404a5bea0cb26468b4fad81255e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00215.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00215.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aec0935ec96ce7c58884d5d4393cccef54df6396 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00215.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d85e21380942fbf80c121a7a30ea704d69b86e51d36963387ee38aeeb189f75 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00216.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00216.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5d1e32b47534547c2d247243e9ee92960a9bda45 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00216.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c18413ef663b0c6872c56ed661314ee0798a9b146d7671f16d6df70707dadcc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00217.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00217.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c4851f84957b93d93a7695617773522fbea4bca8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00217.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978bd6c085c19901adb09e6db92fa93c2007b912218ce9917e93ed2f379ce653 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00218.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00218.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c5b03d14da81de358d20303f1c31a772c90169c8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00218.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b7731b697493bcdc6f95bac4f66110b788150408855ee3d89fb3c5581374c20 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00219.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00219.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ce00d212178e9edfd53f77ace9ad851675826af --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00219.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc4fff8e361fec7a4eb1964f11e796238fbdd36ca6921016093acd5a4c18975 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00220.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00220.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cdba4649cd66c2f1495bd5b0b59bbc09536797cd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00220.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8537b5168317869997e306165a3c37b453621054b380e12d004a3b0ccf2ee0b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00221.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00221.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..156d2f1abcb8efed41349084bbf15827d46f6304 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00221.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dfe1af57b9f73c29e671110b61a99f2f7375de1189e840b5e30dd8b68dd55bb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00222.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00222.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aaa0ccab1b7f679d52e08266996ed0e270ce767d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00222.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee99a620a48abe43934340fba60eda1888f7a35f59569004e412887de03e3be5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00223.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00223.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d82980784dbc99619b6123302894e40a8487083e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00223.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654455c51b1240265cc98ae4b76955d84b966bfe5e468dfafe82c5e17afe5511 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00224.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00224.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a10c213397b1b31e4f5bf1347dd581a83028fa47 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00224.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f85c51f5d68bb7e31926aaaafe3043babc8eca40d3df84846053725b48dca67 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00225.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00225.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e924314e2896bc5dcbc728f176e56ee120747368 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00225.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20b2b888f0a3b4ff86452d82c8665d26b654a296ccc8c2dda79f2f5a66af7d28 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00226.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00226.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..960a1c704be7057136e668e23845793b95b9192d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00226.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e161c3210eb86e99404e61ee464200fb8a9d7ddf3f8024dc143771787be65349 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00227.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00227.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..19a5b9c711965a7ad1ce84d6b4705ba0af3765aa --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00227.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47b694566d072cc85e8c35fbf4f2f0d1d7d793d640ed3c85e789eb3fa9b9baf5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00228.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00228.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2e630185fdb4f1178bd2dc4d2b280e14e9591354 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00228.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53cfb29a26ce2d97804b7b1a67f85962ced733f17dd6c311791de49a8478f2c6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00229.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00229.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d2e5b3285ed0aec14fefd7f93790a93dea0f9818 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00229.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40f9ebfdf03582580c704927712cc5a02e4f92b57c37693842ea9d572db447a0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00230.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00230.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..20c5aacbd8e192caec247e987569335ba5cc81d1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00230.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dfd6a84d603f06bd7fe8c24189837b763d5d12d47888bf45dccc6cd686f04e9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00231.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00231.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..059094ee2a0880689098e2adcbf32225e5aabf3d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00231.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4780c31febacb5f645df9329b9eefb28dac2811b7c6c096a943984187c0da255 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00232.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00232.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4bc632b7c0d0fbaafadcb50cefe3c89923f9f7ce --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00232.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9885137ebb974eef7ff0018b4828ba1298d484335791238b522fcc894ea4a949 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00233.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00233.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5492b6cafb9e26fe596d1add2162732de698f713 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00233.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169c5ca59b80ad3be0b6c73718dcc4ca0454f529ce455e4557aebed27fc3e46b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00234.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00234.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1b172fb91b482ab065da59534af6dffe7d3547c8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00234.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7d7081b03eeb28a9a75e488c89375608e4be74eafb1c2efe25d24ee4c3b31b5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00235.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00235.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..21de391e7905d2ebab804809664c72a65e7fab56 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00235.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a243acc866bfb563e44951448175c1b27baf3bba89b586afecadf6c87544ebd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00236.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00236.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b8626b2db6a865a3fce1a6bb38e9c25b0009cea4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00236.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59fb9d356c093fc6123753ebef40571dd086c3a270fc9d8e9d69c962740e2db7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00237.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00237.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df7ba637f0671611187db445ee8cea31c88c79af --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00237.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4ea4c07bd491bb843ac0799f3854d3c4a461ce08e8c515728be187f6a43ca7a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00238.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00238.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..930084eb977ddf128826e9d2a420f724fcaa4481 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00238.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e2161020e75a2c14dcc81091fb5557a92acd3ea22d827d09fac6ec73830ff74 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00239.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00239.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc67215041d8d77a9b6e040da6b2ebf4c894a87a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00239.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:306cb856c35ac9f00141577ca92b23d6ca78c100bca3da1e51bf2641abe0db46 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00240.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00240.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8704f2170e421a5ad97cfe68a3e5dc35c5769a55 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00240.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59766b14177bb6f577d2f20e2ebda1eceed5f0c41affa0e18f1e3dbb6bd81097 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00241.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00241.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..51fd061bf021d083d72830c2300e255b68ee19d5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00241.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0127b0523e83a980007d8bf1dd028949c8e3fe2975d8fe06b88c80849ef44ff5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00242.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00242.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cee1ddff4fbd7376b52538517458cba6755a105c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00242.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9227bc5a8681d65f88ecf2829bf748ded443df7383a571c36a64d90d1f64d17b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00243.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00243.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cbf65197fbcb882fc00f218cf07de2b627962a72 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00243.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d4acdef95f25297e0bf6c4fe0630d5815bd2b8539267da931753447dbf3a98 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00244.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00244.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..04fad6d16be7d5cae25849df1acbf60b99817092 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00244.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b77127bfb82ab8d73d1c0e13345653e21f5144799fbfc2ba3d34e8e31764819b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00245.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00245.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fdd7672c3979b64056348d85c40b9a73bd131fa7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00245.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a328753138331e5f1081a514fd9b2746755ac7a0cfa96fc7c32cc571b60e8eb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00246.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00246.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b52bf41d317f06298b011048888726f4472a69be --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00246.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33d60f8de1c1189be23975961c9058b18400e0c03fd57242c37da6c5b39b0089 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00247.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00247.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9e62c2122867d2cd505f762ec5a52905e7316e8a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00247.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44678029e72f9006e3fe896e576dbae2310b350d6f35032aa0ad076b3a26f43b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00248.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00248.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1683b617ad5e51cd2b92130b13f32cdf95eb192b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00248.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4244494ca5856bc599f7b6407a88cbff00fdb1280b4abe69ada58e57d7e5636c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00249.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00249.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dbe6df12ece170da5bf2a8d763d5910db6866b54 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00249.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67ce0493a3daed3b1d8acb1e7173d0ae2be5e372ba839c55f06501c4db4471c1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00250.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00250.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bdf505b12f2518b01ad975163f253a326e516d58 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00250.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d552e2cff60c95bc2b3444920bae93ecff69fcf2d04a34749ce210f498dd91a1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00252.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00252.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..084362634c7fb43c4a754cbe4984d348796e6853 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00252.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:564972f3b70b5d64badd7b114ba9c4a65d1459771be8617d6a292b1b714d5786 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00254.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00254.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..472880af12a524dca08d99dfc7c70f8089b34644 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00254.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85f3efad086836ad69f7fc837c441389d4efa82df291158746b552558b9db818 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00256.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00256.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2019cb633fdea606fdc5841a648c89675ed6ec14 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00256.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d2c87d8fa88e0a1e7a72ebcb542fd560fba47d1c84661e514e79460342fcf25 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00258.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00258.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..145e4960b3c1f95e485cd6e006ce0482fb28620f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00258.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16bf506d288cdf46c8339e5a6010e9f12bf5b363bff0651579a3ac4cea33ca05 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00260.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00260.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b61b5ea6329eb79dd2e000a283144340f0a0ee6d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00260.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32c731d8e81234114ac779ae583423e4c96bb3c4d6a30044ce1236a999d819b0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00262.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00262.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..68365731ef25c228b72b72730e0ea5c3af7bbe4d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00262.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17a266b36f6c1d87104dca6d4335d16c68205304518770deee993c119fa2ff82 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00264.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00264.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94922ab7d54a43342d833a3df9829597a414c323 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00264.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed42cbdb291feafe32877ec036fac1e9a43eeb2e58236028ac36e4b54327e711 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00266.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00266.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..25112106d294f91487c36222b166ad458298d62a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00266.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08aa076b2b3ce963d6e30197a90f646e557e0d1e96789b7bd6e826a9e7ccf617 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00268.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00268.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dfe66646811a3bd8421b1fa05f5c079d227d4498 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00268.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:803bc909ae67ffcfac94af1eb30733bde2e03b6bcb3f1829329f7c05c419f2df +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00270.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00270.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..621723622cd5a74f76c4e7a41a9efd1e1c9beccd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00270.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ad28ae053b9e38d9a4fdd7aaf4f45b9002589abc16248d6b26d018dfdc3d3b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00272.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52c83a70dc0db640c2ceefb11e0e18fee6e09267 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b287dc67efec161d550bb9f4998e168a05ef773ca86412f7e17603243c91d40 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00274.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00274.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3c8405acd15342791b884dfbde985191379ed1a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00274.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25549bf7d55134e0d63692ee25a20ab4db4a27acad86a07011a609bfaa9ff1a6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00276.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00276.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..16fe9cea84a4e71bd0a424259ee6fb3f22153ed8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00276.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d61ef1529cf0940d9d856498fc5894cb9dc233047c131541c0adb6d936cc305 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00278.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00278.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7b40b386cde2ae58efe25d692a8f17a96633a2fa --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00278.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13f2d0f5eff92e40a91c7210296d86d156201c590520b9c27d7bd8bb64c8ee45 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00280.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00280.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d6e858fbf178452eae7244a2e1aa62063ebd9695 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00280.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee5c50031ee7bc4d93944cad44281acfca582aaa7120f5a1be6f6e495e22504b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00282.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00282.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a2f6295093a46f33f523437c9ce6cdf336b336c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00282.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941c8408056f2ef0c908b45b27f9004e19affc0d4c3bd512234d942d05595863 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00284.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00284.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..46a8482619ddca40b83b161615409f87553f3716 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00284.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:474869190ffaa0a5b9d7d7f145da513c11f7015071891aa064c88368c27f60e7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00286.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00286.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6cb8b0aba29808c5aab244b5a9cf5fa41f052824 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00286.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f05e00b5d02a4c1d21b786ec1285ed62b2d0ed6e1aeb4f820126ed5beecee91 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00288.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00288.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ce5ede8b2e06b798ee887c0c8c66425c8ae8f25 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00288.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42dd4701ed6e9ad3e94e6c5310ae1beb348ad3277bb9042884c9d56d30d28114 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00290.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00290.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3300fe05152785386519f7cb39d8331e05df9dd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00290.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c5f75d1916ea87e0fd80b4d9a092d39202429ce6799a4ab6dff8a2ba799d86 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00292.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00292.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f2ab1f9a58291eb8aab73e2b6fe276b904eba31 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00292.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f544accc42349b6c9d1986f5baa452bc7bf7ea407ecbd337e44a62ad346268f4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00294.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00294.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..147073969262acb00c184e55542cc1670ebf7db8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00294.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:919d243625d1d62081f22d49d91e3fd2aaebeae1a18120940060c2b8a67e21e4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00296.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00296.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c27a6c6f9e0a155c91fc70c0d81a857ce2661b57 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00296.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5c017cc8671ff130d9fb8ff1c460833fb655e799c0ff65d8faafe9cbe345230 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00298.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00298.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c1d47d5d5e22227ac84beadddaf1b44c9792f62a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00298.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:136fea09c5b25907af8a6d1df0b40f569e3a770eb1a7902f2a4d5bb2e2e294be +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00300.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00300.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c7e02ec43de73e0e790b919cfa794c6fa6546f70 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00300.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1453d91ad6c06c8f398b067008e27d1679a741d765fd1eab3c3c4759e33d4a50 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00302.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00302.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..41adc4863d5e73c7e2d436cf865012cff8a48872 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00302.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f0c03b64fca9c11210e31ecd3bcbe7a5b51411f533f798cf2ea0be720bce7de +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00304.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00304.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..759dcec4f27164a0a43ea7fce9340e4a52ca5768 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00304.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e72099f278bc89258a694d7518ae94a8f6d22e320ca2a4a7572ef6a926e2102 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00306.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00306.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2b5233022ce124e26cbfc9938a95e7a76f47acc5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00306.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe3aed0203a6578bb7e499bc12c01525a7343b3b1b3dd3315774b3bc9d7c7cf0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00308.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00308.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..505c7f95b517754752c9e309343b18c42a7aef50 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00308.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:962ad9b08b0c8f058186295d0175daf3a9c490ef144b264efe7857368de99208 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00310.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00310.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c832872dacf32af03a9e208580da5856ddcf8cd7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00310.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f19a047961269574e6aaccb87abb4ff76a88412ad2c2330c5438094eede529b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00312.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00312.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fc8a7cc560774a3a7792208bb4ee22b7c8f4f614 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00312.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c2cb00c3185502f4a6b414b19d5a4ea7d57470dcbfafd60ffc336716c694cb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00314.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00314.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c36f8a3e15c3cc6dfa44394af50dcbfaa21213c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00314.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea2b76325c36bcf49577e85450acb273695639ba975a83b8cb25eee048ef10b5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00316.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00316.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7686dd0db18a0cd975186d92d4c0f4e9e1faf019 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00316.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fac18bcf5ef2c3fd724e12e0964a9fb3c5c7544eaca1be139b51ef4b52b99131 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00318.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00318.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d286d07c07810fa9a7bd24370439ca84de6cf6e3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00318.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccdd90975051267dc705422b73f3bc15b34b3a52ea7f2d22ebdb2e7e855670c7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00320.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00320.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..552021bea13ddd1341753ebc847e4a7d2db44001 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00320.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c04f5c49159f2aca83565f0f706575f2e94f211c6168387eb5e2be2ae7ed011 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00322.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00322.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8a9f7ca32532caaa89824fb4418c2b4be124430c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00322.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7f393f2b786ceb6b84463cf446a10dfc48e88bdde3d1cf10c975eab9a0c63c7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00324.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00324.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f984f3dd347fc3fc78699a96bd98266b2ba01ee --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00324.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e643dcd0bbb165217b8fd3b76403b37bca3a7c424ed514a58880755a760eabb1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00326.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00326.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ed66ad6cd42cb6d896a7f2b9668221b97aac175a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00326.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:755cbac62cd49b4fa9cb3f072acd862f6598085027046d8f74e014c50d64e95d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00328.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00328.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e15a096a2447859cb46b89ba64522cc524a274e1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00328.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef5424a0561ce5f41b07072f8e5d526ae745d5f84c23b793923feac7319c8831 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00330.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00330.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a13cb14db309f05f181b025b7a32b0365dbe571 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00330.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f9d34a8548e507de483e2bd627a5d79448290dcdc7838a47a64866bb6540311 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00332.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00332.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..560258d46437eb15db76fb708842af04637fbf33 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00332.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:473312eeb9c9ad622a3d46ead60bd410bc9344dc74fb3deb1b567fab81546020 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00334.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00334.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cf00bcd3672d8de86770e4a36cb5206f15f8d720 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00334.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60a050b2ca56916fd33d015d6ddf730f0396a7ed12a1ed9a3e43da22c61ffb5d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00336.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00336.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b471b8769aa01db14cff54d9dd9acfa8785b9418 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00336.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb517d88488e8ea920ab569cf993f868493a288db979974ba4b69281117ed1d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00338.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00338.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b481ff2e8b4e20551950d84f6899d430374a4237 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00338.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f14da7082c81eda54771fa1a351c810de5bda92b7ae5fb45b25152dd8fb86c6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00340.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00340.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a0941d8b15e2c03067aaeff67cd4f03e1cfc12df --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00340.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:100db96331425222cbee8c9f96bf71136d84cf3754c56cde927a9c95ee85b213 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00342.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00342.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f33a7ca8915679ecc0c73332faeb94d20ddb2ee3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00342.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ebfd31732d230cf4f51f4cf9311792783a4b956a64550de51fb7afd53fe2a8d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00344.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00344.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fe800b149625f6f131b5780a05b26e6a233c0f85 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00344.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:346c3c51cbf897d3e1a9c867b63cfed33b6e0a1fa49315104ba087663517b7a6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00346.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00346.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ab26b526ffd32a425fb27377fa65362c85d0c462 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00346.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be1ddd3e667ffdefe5a2f1cd0e084348e416fa08cacec99c31027f770b9f70a9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00348.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00348.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4e2b41f03c730d6fd8e313e5cd7906a3878ab03d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00348.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b91f2e3933f7f246a8af1f75321c8346141847ec20615d203c5b6d7368da9e7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00350.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00350.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f07b5a73293a73533684be186b2a96a842e57e8a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00350.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b20bdb004fc7706fc2416be8d7bd814613ed52dd7c35989aafebea87523ea33a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00352.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00352.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..07b9df61e8afaa918dbab2b87fef1a1df5116a74 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00352.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21a0f05b3560cffcc5489a5f286c2a6ec27ecfe70fa5d9ddb43896616b38b16d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00354.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00354.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6eeb2b39ffa2b4b6630253851d169089ca0a01fc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00354.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85805e631d9819bfcab2cfadaac89d983639ca94f427758e525eb2520664db0c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00356.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00356.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a5ad63f964dd30e4731458b105a82416e6568b97 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00356.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0abd4d4509c2c99cb47eca0725dd4f8e84ea17a5662eb9f2704577ae06fa0d1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00358.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00358.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aa0595d6775fe72b9346c7f1ef416e4c51c48ee6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00358.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:837002cda9966275a065a5ad850d3c7eb7e0137d579eb8f08400aba4195fffa5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00360.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00360.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6614fed8d39da8af04a084f6c441d2453eb14d00 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00360.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0979d24fdac495577d1d0f34003bbd9312d5324c2002b9ad22598ce9a4d2b6c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00362.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00362.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7b27bbf9a77282cd550a8cda859a4f1ccfa3c497 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00362.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:979d51b2d69d8d6bbc31502b5cfb188b07060fbb2c7b374f07d2941b3006a730 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00364.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00364.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..afa0e3f11526f0c0b75c7005669178dde116af3b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00364.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e68ce06eb15daae6f0599cf6275474549971fcd6231d602aac3d1d12e5dd4f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00366.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00366.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3112230aa34c442641672503ca2167a1ef52a42a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00366.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb335c5b5b7248f56b619df4fac425b9e231d79dc3516c630d541897916b8e9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00368.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00368.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fc441bd26b1dccfa0dd5ae68a6a2dfd7e50a573d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00368.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6bdfd9db7629905f8a17eeb4cea4f030509b5f67808c2ae28ff55440f1c31a8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00370.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00370.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ae8f3e1ac4d4b6f9921767ee79daf4fda99ce451 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00370.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b09e004930ceb43d8b23df6a14f08415f0aca4ccfdec94b3550070aec2d8b5f8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00372.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00372.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..72cff488f99321ed5ef15370d446e2e59bc3943b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00372.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd1a2edf6faa189f436c41334c5778ce5ab101faa59b0fd9767e0dd6e63ef9a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00374.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00374.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a0d2f7134527aac82582542788d73c79dc2f73cf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00374.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73f0a18782ac84ce4be14ac0de65eb772fe9219c93f474bc6a07051651a5b111 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00376.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00376.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0053625a60418a435d372b3e499120bd8fcde29f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00376.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1938330928976b238f4df82e8228e9f399d86a83c6d2ff307d2ec23ccf28b180 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00378.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00378.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5fbc51db211528b9b135a845c88d86bd3c97d8b0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00378.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de8b6f461e1cbd74f916211649043e4b94c045c30cc6167a2d450e4cac17a86f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00380.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00380.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..32fef0818bdb8c32d7497309f2b4d826137526ec --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00380.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a9b11138c43ede367c101670eaad69336de5d4db6fb949a6d9d424f4c8f3eeb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00382.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00382.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ea2fe34ec48876f9155d6b0bfb45ed27a4327e4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00382.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8af73cb8e20387c66d942cf731a622ab595f5d83f30f9f9468490734f1a6f66d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00384.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00384.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8954669e09c6926fd507f1847a1a0c997704d01 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00384.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aea3b2ce70e1667610f875195e723a83fcffa52682b8a9e2e07f5042266e27b3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00386.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00386.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e7a55154c67c04ff0a529168f9c5c9c5f317ef0f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00386.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58dadc9c4231c8c92669e93d0f4055bf5c9a3d542d6400b9d7adfbc2b5b3eabc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00388.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00388.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3e9300bad89a554cf0f8e9cbea8c6744346667c5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00388.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7f8eaf3276bacfed78dbaadb8cf811a6c92b073c2dbc4abdeefac03bb3100a2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00390.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00390.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b1891f3daee87e72bccd2d9adc5cff5f6693763e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00390.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f76ee7394bfafdc919655fcf1a55ae87fa93032de3ad637cfe93b352155cbe0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00392.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00392.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cff50e184c568200d7a6f14f50ab450b3dee04da --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00392.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb97616222c4bd65c7bed99a28cab5f690443b061dfa8a39948ffa1c47404887 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00394.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00394.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9a06a0c1ec3eeb0719c7fad965912f9515450eb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00394.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb9d1c8a1dbba92bf2c91ccc7e18b664a30a0983a7d4f8cabb73c5e50cca168 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00396.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00396.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e68017070c2cb3c89d31566a1aa8ba8f9a7fb5ae --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00396.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84ba1d354612568a0e090b09bfdb0cb4ebd6ba142c48bb3a3d9e26bf93145e5e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00398.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00398.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3d74d9d73e9a613702f91d9aaede71a8b220ab32 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00398.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a590dc5eec25e2cec2ef73fad5d982073536d9fcb6c226436e95a0b3bc80f7f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00400.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00400.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f1f82b38c4fd4b030d9161def35822341d47640a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00400.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d13cfedb3d4698f53ba4df4df17ffefd23b8c1d63bb13f5beefe2b90b81d446 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00402.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00402.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e3928c6524120f35153b0b696dd5e19fd5642873 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00402.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d108417e25fb31545db625b1b89282720787fda5a282e6d020b39852823e0e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00404.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00404.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..079bfc2bc6a1995773efb13455dbd23c363e930d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00404.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0b71cd4685323dce159d6634cb8fb0e656be7597cd4f465d7b3db431a022e7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00406.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00406.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..869ac8e842712ea10ac577c7c51d97d3572b5886 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00406.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b552cf7196ff910a89be4d09583f5d318e8bdec9d7daf97dde1a49bb57ce7450 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00408.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00408.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8e6c505e48f2ab657ef570bb5a61b0aebf36f261 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00408.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d99c95889e588665f5e6ecdbe4a3f2e07c4a47cd4b3dc9341b1eb98cbc514c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00410.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00410.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1ad7493a58aa4fca54e12b3254244905848cf786 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00410.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:456e2384d391f3f1f3293c96218cdcc716fcb4f16796a53298a4d2c271b28d2a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00412.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00412.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0569dd629cdfada552a1dcc4ceebfc31aae22dba --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00412.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b0450945bf6c1ad41cd2f7524a0bfebe4ddb17256e28a5628a92b1531a94579 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00414.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00414.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a685dd550900db3b8aad9facc3b9e4af338f4db --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00414.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a753c20eaf111e4721dd5e2bd79c1b6a23e562eb660c1fb775f4337341afef8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00416.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00416.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cb65ee057745f4e10e7afb533b8b33d7baca6907 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00416.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7124ab934dbe54886e0c8a6e0dd3cab29539a658ad508919f6fc2d5abab5797 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00418.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00418.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..258f84e96c832d6219178857a8d9ba3dbb06846b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00418.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb351953075f049a847dbd9e8f9a4cde87e68f9c1ce954b8b17bbe59b3edfa2e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00420.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00420.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..61541b2e3e7f09c48cf38f0ba4802cde6a2bb808 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00420.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:018c09f7b50d84924f3d2d3be8d8bb7cf2a47e877509423a2d70d5e07281d5ee +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00422.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00422.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ea055aee0311830457d213451c100692d706941 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00422.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a48dd10772e9b8be5c20b2864bb8454061aa8c8231cd9deaca5e38af0b296a5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00424.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00424.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03fd2845d1758fd6d7b27a7ba76674a392a1193c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00424.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05bd54af3936febd416c4d8ec008e2331645a5c4412a8ec7b9bd4b5175d66ecf +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00426.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00426.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7d295a4d92ac0f424198c0a2be034e870cbc7b7c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00426.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1df97d028e86bed3cc9ea68501019016c19eb2fadccd9f77f91c9813b42a9b6c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00428.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00428.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..99108ff04f590a2883e6ec659f6b79b2d1608148 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00428.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c054283253d2d49253bf0476dc5d610b8f2ac5997f4468bbf831b64ebedbf63 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00430.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00430.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8cf8261fe5b56bea6db082ad0bc3a6f02fe0c04f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00430.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a98b20cd5872631b7f869b62878c8df181fdc5623aa71e10ccbe09faf2940f1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00432.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00432.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b266ac635adc05f89c45108cbdb838d57fa6f693 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00432.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed642039612750db7777e5e495c13af31889659a29ca4e07bd4e8229cab1d326 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00434.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00434.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b697709eaa6385340ae098827765a0d424134efc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00434.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b697a5bec7f7496889b1955a2718c6fa81a773f69427fd90f973a80dfc3ff84 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00436.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00436.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c7fbc433c27d68707f97249924d01cf91733e7e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00436.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:950b2929eb2f9d4aef028ed3e6eb48fcdcf6ac6b7643ba761477bb52ec23c2ab +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00438.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00438.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8c527f8ad5d94764f9dd529d03117f24566f025d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00438.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0a47b03a7635a6da120172bad71a0cff13f5be94fb127a78b56d2ea246e798c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00440.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00440.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c2dcab26bcfe61e75980bf5094b0533bf107083f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00440.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:457147e9586baa529497f44073d0822a9cea426fd53cb55080a3a0d13e11aabb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00442.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00442.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8c2f139fd17a29e13bf9e09a70ec750c002c1d50 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00442.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7026fb60ce72f3cd967c2966188912084d737620129171588a9755da484d5652 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00444.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00444.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b769327e10b4aaf638254bee0d118cd8ac7a9390 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00444.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1321141f8f4fa87ebf04c9cea77bcf787c7a110342456ef93bb75043da259c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00446.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00446.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a3fc93cc910d079e3de155ede99f2784126cdb8f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00446.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f234a38ffa8a0f445372b5792b9e6de1013f6c74e0adfbc067aa21a1fc37b1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00448.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00448.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1615d9548bdccf1f911c2dcd13d023d3c19849d5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00448.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9c6c27b418c05e79bc8635491f416c61267f04b9950959f80910e1dd3c4ea8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00450.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00450.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..26ee10c31c5a172ea6f16a6c7e504a83320ca94b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00450.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e558aca5e1582dff87a138bfb6dddf99b340efba48965464f02b3ce32b96ac0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00452.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00452.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7f6c271e375f239fad466c46049d59d18335d17a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00452.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:976af9094e198dccdeced5ab45021e285e3cada493f751a17368726f1c7d680b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00454.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00454.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..463cf30c08559b9f738303c75c7f91b2ea09da54 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00454.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17abb7820de90f5d70242888ee908fa5f35847c158a2645dbbd4bfda3905c1cd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00456.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00456.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aecfebcfb5c827a37321fab480ee06fa656b8924 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00456.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da3c814353b39d28ca274fe668b1a67cf12071b561b905ff9bb46463ac8ac01b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00458.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00458.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..56b8f73d645ddb17c01ed62f973178f6f5f6953b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00458.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:805726a2145d9a6d971717097da0f279c2dec356f6fe45d0360fee1ed58de9dd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00460.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00460.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fb6123f0082baeef183db149235159a790ddfcfa --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00460.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85707358a68b08cf0d4ba63e57b9e10591e9de3552a833dd3dfd05a7a91f11fb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00462.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00462.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5e6efac37389a7607e632e82e2797e65045bb11 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00462.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f003418497928207be1d562595a05a3a61a019f6873aa1d7708d16f5b2b3d243 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00464.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00464.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37fc91da12939a00aa0ad4917a66c5b511c13010 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00464.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:752ad3c0a32f8dccdba0db5db97f1dd1f13300519f5f7c97fb0f1cacb7a6a6c3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00466.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00466.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a89cd85e7a9d94880a5b2979ce68a89a03f515aa --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00466.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad820d829a02f80b65756dab258e62aedb24e2f42e47cc15af838f7bcf958c9c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00468.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00468.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dbd2df5bbb41d3a7b96a619ec7a1a83f409df5f5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00468.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e19da6a11f9a9469db57f8214f347798f6a25ae601c11eb19649e0b0cd714f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00470.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00470.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c945b6ff1cdd8b7537d101a85790144bdb213361 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00470.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14915776d17030f0a5b11201fd5d3c8d64a3d38c754af682c0f05ae029a69a5e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00472.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00472.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f7e69c4a44e4375ed3322d1eb7f73fb5fd2874e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00472.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc0cc4bd5f843a819bebd02313a127b0280c214a492c49e8d1ed92419565ea19 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00474.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00474.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a314ef099b947eef225eada43e58e319cf9ec66f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00474.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afd5bd0d7a6c008a59e20c9ef968ed3369a24e06f3b6aae4d3679f4d167520c1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00476.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00476.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c448e441cae1d4ad884804cb666bec02864eaf20 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00476.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6871210cb95f03c2db9e58a6490e7654e1612e71af54aa71dc4d0e2fbb450550 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00478.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00478.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd5408ce5abc7c169799d687175cc24fb51ea070 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00478.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458a6e5813f20945c46ca4ba869f1d5e74bec5254db2f85169b2ec0fae172718 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00480.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00480.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..77556ff94db881a9fcf88e83d8372ee315463b51 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00480.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b3d6bfb615865ce3dcc15334fa1ae33cbffbffe42cd221f038e111a5c84301b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00482.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00482.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ee492f1af93fab8bb4bebe35f5ebf0f78f7df259 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00482.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4acf672939b8ef489323203eb9a859d7ff5e223d3d5155a65895287bc6a76b8d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00484.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00484.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a697f665228d3e5d21196c2f522d9fbcc0e034e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00484.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:455882c178bc7b90642b8581648e496357f4026abac2601f60a28533472036ae +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00486.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00486.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..046377e3eee3db3b5783e5f98a54e5316a7da62d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00486.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ded5d2f59862523eb0416d9f7eb454fc11745396156cdc0a2315e3e0263607b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00488.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00488.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ac2144c995107a3e626694408b4e355122194a6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00488.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a36ad365f5efca9dbffb2bad3a80750759632b0d8bf0dbb8d382237db9abf03 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00490.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00490.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d6a2ebc8ff30ea6a01dd992fff7db2b6faae04fe --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00490.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce3c3f766b5c520e681cc8d2e9af0a4068ab4d7e2075ab5bdefba342ac014ab2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00492.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00492.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8389f94e025fa20aa4ef1f27832a711a65fd292 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00492.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55af6038c5cf24ba885498010c74fe6a7e4d05efab45aa4fd623d5e97300ab79 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00494.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00494.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ac5392db86a0e1552e10407eb1913784ef6b539d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00494.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3ce926f24bc778217fb8bc9a49c8d4be38ce387d539d609eb6be382f778b2e4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00496.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00496.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a58846b702b6c7d8f42c049e60c8d9f4f53712d0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00496.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48cfefe6e7672cf2d48faafc21cb80cc77b33a5f4a6222c7d46ed10733ce0326 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00498.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00498.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0cddf2774f4a0b8f094e873002ab971f076257e5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00498.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:559ce54449ba110ef173dc6fd649d15acdbe798d9e0003e12b8f1669bcd4099b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00500.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00500.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e9bae4c24756e7a764b356d8e60c63d6502748dc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00500.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4992ff782e46d45eb34fe92c2036a200f181f72945c144aeeb3f8ecc98359133 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00505.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00505.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1c238587e88bc031f76daecf823809b5fc3ab296 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00505.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015679e02d0f4e20189be0f9af9a1ba2389f16235e115a607604cdc9f22254fe +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00510.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00510.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5709136c791a63979dbcbc2ab23b2ffebdd65a9d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00510.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1476eac43965e597570143f98540c8979ae1812ea0560a305de2df777a86610 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00515.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00515.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7831e0f9fd12f8ab509157b0b7b694d7dfa9e4d6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00515.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23ae6ce6a165750f200937d3ae4ecd63b52b33b40476bbc9964b44d28dd0c39b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00520.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00520.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d9f7c61dfb7d1e4508f13120722764c26ebc64d5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00520.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab503681b01e3d50bc83581faa6c1c58d1b5812c437f1ea86c08df1d25d4280e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00525.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00525.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8365290b695b0ae98f4dc6abe8942d8b4f484be9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00525.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82fd6bd6acb8084bca9fe59126aec38c9c135f853c17ff359e2c897e570dc099 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00530.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00530.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..422511494ee61c8d3c1337c3bd4d0b8181ae44d8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00530.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0c4a532f4519c0ba79a76e933ce706701025297374a56e994c80b80f95bddcc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00535.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00535.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c4fbdfe9e596b0d2a9194af3f4b4745406531754 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00535.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37591b8a71db1217fa2b6d606f63b57bb04a64176f8c73ede3712698bbda08a4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00540.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00540.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ac1287a66b25d5b43da048ef76881a1edfdb76da --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00540.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e789ca9b88906085a6787533f6bd589d87c05aeb19198e3e6cefa7734282e4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00545.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00545.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1cdc43ce8dbfca95c0976c957017bf14515f9960 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00545.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c3ab45cdf2e85b7328c4e7fa3281f4648578d4cc82705817898db11f687cd4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00550.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00550.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a71d930b64546a07afefbd5e314337754086e6e8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00550.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bce77e1ea0676b8e98ab7d6ab8aa6637b2943bce6cf498c9679e594e9cc808a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00555.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00555.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b9f1472f046d0a2258abbd914a556ac903019dbe --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00555.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cde4e8e37d361f44d07bb05e29a5c4ea61d8208c481051197300ddc0acfe72da +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00560.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00560.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3d9ce6e3974b2c8f344f12c129ee0497315048f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00560.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a081d271170939c95eebd12e84b46c12ec852724e80c99c7986480363c7ddc4d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00565.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00565.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..740d41263c43b4e45a6c1202b3ccd84c399e4231 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00565.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33e1dc32095b606a188b4a735b7ab12e6b29cf5c2cfc43aea631f53e86d4bac6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00570.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00570.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..701b7054fad65573ce7d3af8b12b3e2d9ad814f3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00570.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d62daf4b356c486840c879b27704f764f7afbbdbce8efdae572949dc6e5705 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00575.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00575.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9aa05a7a03cf8b7d45311fe7356018d064a6ab0b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00575.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c63386d8fecf5d1e1a9035d3789d144854be599e7dc7a12e44952f063aaa3598 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00580.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00580.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ee3aabfd77f859f2dac94fcea134f2a273c7142b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00580.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f3d9460514613d792545d8df3ee55d6c4d9dc602223db3c6a853abf78b8d7b1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00585.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00585.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c76ea55ea95b1244e72e2dabdb5f3eeba75119b7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00585.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bcc78f6948127c8dcbbbda6a5c0b14ad9c57b420a9197fcf9df28c392a198d9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00590.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00590.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..63b60cb299575d7151bfa24edbff7ff351912d75 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00590.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67646cd3c6c600cfa26449954a993629085c4a75cb5a1bdbfe3c6fc0b49e0090 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00595.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00595.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..67e9a32cd6faa01de38dc874a12a60794404a602 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00595.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c6d35150986d4ec5078f6b6d5da85113006720a47555e70996c518b993e64b9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00600.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00600.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a120e1ef872eddf5140ac24401ba87307e2f0101 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00600.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0b8453a264d8bb174d4c9ec8d0bf19333fc50b1eea9a6c8222868d8da29cb08 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00605.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00605.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..daef74af7f617401ed07c47d2394bcc22e1c8879 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00605.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9541fd6aa998505a08ed42cb10408f0ea4d54c126dae3c3352cc5b07f99ba62 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00610.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00610.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ce47a5c0ca58d6b84d2370bbc382602ecf87752 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00610.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae9c9a918f354d71d64c2690e77129e41ff272749e9743c512f37703f036e34e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00615.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00615.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..92f40de09c7bf7a239c9e346e6cdaf1051e00904 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00615.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f51e7d90aa7d703109de040fc9d04fcaed95e9883f3daf21bf19184e3ad9d795 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00620.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00620.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..01c433b432de1311c2539eac7972e18a470e54ca --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00620.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d6a690ad44b452621dc78cb0b7fa4f6bdc21e3d2b23b8a277336a5a079c6fc4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00625.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00625.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9c02c88f42bf66237a1e3c7f221bff54044dbccc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00625.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb745782f183ca10bc4f94a3773796bca7fb52020d9dedfa3356359a1f7afa7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00630.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00630.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9333e2c058958e5acdc1ab695fa66c9a840f7bde --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00630.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bddbfe321024fb2943618b6ac58772a4c506f752136489850358180c13702f35 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00635.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00635.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4de3deccd98b9987c663c978ec14bcfabfa6fbeb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00635.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5acbec719413a569243bf462e4fc0f15dba5e3fc6f80dbe5a98afb26700cf731 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00640.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00640.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0acc00df1de66f05c9b89332b316e0bd7cf664f6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00640.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fdaae2b4d5ff57c260cfed77e13b4326204f2f9d6f143ec15e1764a790d66dd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00645.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00645.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df37e5475b7d021776210de35ed340fb2fd07a28 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00645.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a07c7d58dc0b1bdb61bac5c59cb722e90e316fcb883557dc70f8f79d36cdc743 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00650.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00650.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e277c14baae9e9036986488793920ad976a642be --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00650.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf04447cdb1f40de3f1bbd875111e7cb1351c73dde3eb8c890f8c1e9e5c4c532 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00655.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00655.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3ab40e344a9945bcc11540002a4f048191db8b3e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00655.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bf0d431ae8f32f4f156da6946097d988a8f6c664c0bd0404e9b843879ad671b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00660.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00660.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..49b889f6ab76512a696e0fe41729f236bb9514ef --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00660.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:482c49c003b5a0871e9ba9c3e4f3d7869ad9e1ab5fb8d7a09d93c297e75743fb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00665.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00665.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c31689121db24c6f3fe8ae27aed03144a572878d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00665.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c00427fbe7bdd65e2ea8b12414be494e2fcb8717777d62a1978cb100f7585d6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00670.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00670.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a232224e6c4a6308133cf031034d8ade68d56a9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00670.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:677fe87700c985702abffdfacc8ad7f11031669ba268ed8a15497c53a3d11655 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00675.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00675.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..457704d602cfe7dd508866eebf97deb7d2f1a185 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00675.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b23f93b602be84c61c980733a3a78ed68f3a1cb658c7d735615536eb59469191 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00680.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00680.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ab886740d7912f7d461521b9a7985f1c8a102838 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00680.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:144c848a05fd71f841236a071144f676117e890b1ad4edeb6fddf88308a6b601 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00685.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00685.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b9115495259831ff171c6649bcc80ae5763fb9be --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00685.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:871dade365dbfbd69dd86386a37ed3147e012db536baf7a462d1d75877ca9b73 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00690.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00690.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..135f405c4c8f7e00de53c0b5732afc71ceee753a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00690.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e716e0a92abdcf4e0ba0724df1bd408e5625000a83f592b4387e1a7e1c644ec3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00695.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00695.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3895d5c8713818c077f2ba07f748eeb915ac4b21 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00695.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c7e887bd832f163c2a396f9a2ca080df6a7db04d7f7aec4122bee0e2da22aed +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00700.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00700.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b04c27fd322041669239c5cd42784b19bf10ddc7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00700.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbc5d6ac0f0fae3fb0c897a8afcae92b3a41e627bafd9b377a6f3fc343a282b0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00705.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00705.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1acc7fc5974a8f999401badb7a3c9dcf476809e2 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00705.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:451daa7a039d14c30d7e1ebeb132755cfb6a5086c859a1a4e07790de461c3973 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00710.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00710.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e9f6bbfd25ae40355054c69033f80f4489ce16f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00710.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b77b491b93a408d5124aff194fa1e05d51404c08a10cb60bc9644aba25369f2d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00715.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00715.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6cd91ebf219210886aa2bff8566b8b3a186db5a0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00715.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9be87a7eb9ca97ed1b12062bec243e4e4b3e375fd8b46fb84f312e7c69493e33 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00720.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00720.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c09473ca5244bfeb5e3a7e93b378b1784db9c1cf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00720.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f09915361c8246efd9a490d968eb0ce8ad71fa87d79fe842ab5b91f607e394 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00725.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00725.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be2825f837b3cb54767da95e772464064b60c489 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00725.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:339ce2e35ebaf03fc92dd93b04244c3219f235803421f72830e1036fdfe7220a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00730.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00730.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3469820f21cc66bd1a59ced25e2fd2503149d3d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00730.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5841a38a53426a5af5b67c4b0f6f28ab1da73a65ae0b84da6d72d224a7189301 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00735.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00735.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb8ccec589247eef7c0a4c3861f984f01ff3dee9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00735.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f986271c0ee6e1f9359a425dac5642b30bd2e39670fdaf0dab2476c9528cc9e9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00740.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00740.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..165ee2f0c2a893b9527b27d05a7d630b10e2a436 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00740.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986578b48944dcdb91edff39cb3ece91538006ae698ddf24fcfd72290d6497f4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00745.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00745.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c40ed0a0ae389b8cda3dc1e511d1d30db89f9e5d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00745.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eea7ad59e3edc06d2cf7706954acb7d874970baa2d44716f98b1fa334bf4c69 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00750.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00750.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8b5fb4653cb122972497a7dc0dc312611e789eaa --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00750.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:020c9d4f312532675d13ef418e999dcdacc154392e3c9f3c6e6837b7ae1991a2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00755.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00755.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..01f3154a42c4e966c3a766f270cd74cc5d8c930e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00755.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfe1792fe97360e5cfe82e941e3d3ea14c535f8fa797f65eda7414415e786a94 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00760.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00760.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..775f1cd26c892f76259b5003260b9123322a506b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00760.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c0e2d288ef441a3ac01098613ed0a91380e70aa74791977ed487138deba3445 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00765.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00765.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a5b1587e04e27e394cbe7670c2760fc1c60b2f8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00765.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6af81a9aa0287b25ac3234b5fc35a7fe6a7bff8f00da38ccfed7076711b37fb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00770.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00770.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53f257147299da2f240374155173cd4e5e46b950 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00770.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c38935e8f3df07b06fc511ac69a59dcfa41a4b3163bf7f9e02f6354cc21d7e3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00775.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00775.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d9b818d2c83606543b77ad5f849a31d195b98abf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00775.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce2d8a7e6d92c14a386f05a201d67840e05c3c57ff1400baa8fd5ee8cb627d48 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00780.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00780.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5205790746253b35c5b84b8a177d6bd00e3b9fdf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00780.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c2e043a6172618d374dc89d009fc15e882bbe99ce5675f3b12cb2ed1c009e7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00785.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00785.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ab9bc4c2c56a2ddd19b4e3f7a57fe23a6911d761 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00785.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5520aee7f7295dde9451957197b0fdee2d6834a47b92abbe07dabeddbd7ba2b8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00790.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00790.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1684d3c9fbe0b73160e49a2b36f5397d9f7cc50b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00790.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb97066176af8ba1b4a3fb6239eb9c4a4179e99a2f4218b38e530750a7d2d69 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00795.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00795.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5bedcf4486d83aa27ba0d3c14aba9d85e8f9ff48 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00795.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3453433048b5a16afd477b122bddaf89376932cf0a4b6b0d9fd02561717663c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00800.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00800.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ae75a316c95e1213401d1ebcd883c891e232bd63 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00800.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee3aef9d7fd4c6b9535874aa8478a01dd9c5e2f1effd0c022d39c1f4cc1f60bc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00805.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00805.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..844304447480e7ca603669a1d2deee2093ef11f5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00805.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:874b6124d890c4dc0dcde9dd6e0448dd1d6c9244383f04dd0d9e275eabf18e3c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00810.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00810.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..589488f1d66490cad921c043beda767ab99b6114 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00810.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b7abd487451255df70c1997e8cb4a5133aa75501bf8722c594fbf84102ad15 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00815.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00815.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..764e8f19a37a196c594a0675512b1f6c55072f0d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00815.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cd96d446450fe4896fc6312d0d1684a24fef18cc9c4358614443422d17c6e34 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00820.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00820.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd283c9fa183260d1c361a76ac46b4ee2ad8885d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00820.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11bc00ca4115ccd7dc2979568e60cd5004f4a63ceb6f071f0d6cbeca66b32d7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00825.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00825.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5a2b4e052634bfaf2aeca2d0bd3c9befdff6a256 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00825.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b3af99dae8394023b8616ea2249991352724db35ce96752a623672f985f63a9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00830.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00830.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..95706b1d893ad15cad6beec5289552670fff1349 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00830.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:688c477c84d9d6a9b3c973f57402ff6eeedff592bb8ca62c35ee0a803fedb6c1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00835.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00835.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..adb4620327e0768b2e8a46bc74db7e83da23d5bd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00835.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd7bf2eb26279dbae11c52185e65a80d7f633b7fabb1326ced81c5782c91a1ad +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00840.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00840.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0ed761190875a4ed8d90f7b1f907405808194603 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00840.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f35cfbc7cb4b72832e157d299f8e8d4b82cd97bb4784719b8f63ff5cba5332 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00845.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00845.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3dfc1fcc4cbae655843c7293ad1c8572b064e548 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00845.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b736b8ad33a1b5ae95fc58e43040a0ca04108aaaf487e5f7daaa939dc5cc61 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00850.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00850.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0e90c3e1260f7c421d91244e9dfee4076fc06c4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00850.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5afc5e398ec0b93f7407437a8380a2cda414ee7bde576cc594ec351a44c9b9f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00855.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00855.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..113c9f84a4933f5bdf5083ba55b81d795fa12800 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00855.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5626a87f3d68fced27ca8ca5536bbff425770ce859fdb04917475541bab83556 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00860.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00860.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a574405e90ba1ea73da784c58b8c921f8d26ca5d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00860.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89b06dbaa6e48b8de523f37bd0bca46931a6c873b49ef7def72e04edb751b669 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00865.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00865.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8a120d0484421a438e5e70ae27bd8c97245aea78 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00865.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4573ff31f282e19ca4b7d08111a8be0ca239d8a1af8bcb508637852a57ad94cf +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00870.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00870.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..89523f20f6b4443cf1461f016b4994ea3fd4a6a1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00870.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a29b7553f4871089ea586396f611ea033dfd99f0afa236342a51d672c168c0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00875.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00875.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3ca1f5407deaab0403d30924e5ad709c7a2aa2c2 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00875.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1fc192cf6909967273fec1da4d98556e5e40e305f51e189c34859c4c59115ad +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00880.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00880.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6760f1c2795884822df52f232445f3249511f147 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00880.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67afba5de5bbb5906240a3b12961b13002e7ddeaea576f6b66cf0ff1284b7076 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00885.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00885.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9eabdac08f9e65547db0a20e3a73295bdf53adc3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00885.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb2b18a34b73d3d9b66f4ea5594932a9661f07e057303f2067304730ce973b0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00890.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00890.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..826c88f993bea106907fdd96220ecfd778d20248 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00890.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cca6fb0489812f83fb39b8640828e7800aa4aed9460bc8865ab5a658b395bd56 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00895.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00895.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0506f85e8d04c1da7f2113142f0387e4e3048c8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00895.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aa09f3a603e0672340ededf9ef349b84fb8b0e19c07db0da5a737f84c73fab6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00900.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00900.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..99fdf8f87154243e709275050a76eb19abb9b0fd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00900.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae179de3e3174b633fdacbe3362970c89928032c15351414f8e480f0a2cf9d1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00905.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00905.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..161be671c6a2737734a8ab3e4c4a97468e3b590c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00905.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cac6bcf714a0c0cff6ecdb2a42f40abd3e060a9a63ab755aa5355ad50930c90 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00910.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00910.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e7e6c0b23784f556d6b38efa866c0c770d05b542 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00910.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f34881416211e1ba505acb108149005360dcc0407d7347459ff3f7d50e41ccfa +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00915.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00915.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1125935871c646e1b336b9257c63bc15678b9c39 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00915.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5014abf46c91284765bcf1fc96d76bd7d167dc2f281bd453c3e369bc98c092e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00920.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00920.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d0fdc09b5f3c2fbc995c1d25feeffbdd1d731b50 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00920.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:081f358198ad99c25dbbbe4edcd704056d8dcb9c4391ce6668f7ec905455ee42 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00925.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00925.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0ed745cd2de45feda4889bd31c5bc39903940644 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00925.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26bfddc8a6031b77c677fd193fb71937e0b098a76404539febad0ce02fb53504 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00930.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00930.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8448afcdaffe4e660eb84c6c2dc7efcc163ff243 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00930.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:433ec7057b6c2d47d7c689464cb7005e3353ae751adc233ae78ae04b3d794af8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00935.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00935.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3d830a4eb39a588ad93f741b3c22efc021b3ec73 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00935.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db25ebb3034f588d250eb16e97007e70263a6f4470d1246bde3a3c72d4de5a38 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00940.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00940.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dda88ce72dfe4fa6a3f9ca91b7bb8fa407ad8fbc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00940.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a4306bf796d1106f0549098edf6e02802d9dfa28709df6383cc2b0a6ce86a59 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00945.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00945.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..74919c2c6601d16a813817a65ff24a976135a68f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00945.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa44dad75d63487782c879c56ca863e5ab196ff0b46223d3a45e1ad8445aebcf +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00950.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00950.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e0e635595744f5753c4ff21864df4c46cc059d02 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00950.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:264c40936af2fc6a4f6ad3ff4ab8a102c1c354abee90c64a411a438ab1be9edb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00955.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00955.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5d29515a7321098b096ee94a237023f335a13c1c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00955.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b8373fdb765e3becc9a9bdcc4fde2290a2212820ce37234ee4938608de7e0d3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00960.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00960.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6dd9ea8b05823a8ca56fe6ef76b2cf35332882b8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00960.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda1af527b4b90695594b1e28ae8109ee4ce3ce350a64936d644e5e9b184b53e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00965.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00965.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..99bca71e3b8fc3ee7118ae6677e0c43a921f6c51 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00965.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37608b294851a84b86e54e25235d3fbf6475781b97d92fe00be1045d9b7f761 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00970.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00970.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bfc411fee77a92ad24fe16e2fa7746bc53f832dd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00970.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5344c02a93d39af57ddf941aea45fe9a4365d3f17400545fe9356e1f7a139955 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00975.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00975.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b125e3b896721a0dc734c6ea992fbf29ef42f8d9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00975.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3b0c19ced461e6467b26a68956585fbab3ba091a1ad4f6d55f71b083a2d2989 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00980.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00980.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..21e9862e88d12b63d77fa55c2b52cc9a8d48f97a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00980.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf2cec137c6235d50d7ab37830783409825a512cedf4629a6bba547411d7ce0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00985.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00985.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7700fedb8fc1599b60faef571c9caa5c9643cac4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00985.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b528ce5642f99b8f0ea12c2709d401ed19f1ad28feada42532d1fac15da66de9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00990.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00990.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f32362a16f0c664d5d5a7b65cd3f192d6e3eb821 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00990.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff92b6d70cb12da2d6e9837f957a106aa239c6e2c769e119073d14ba8bedf07 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00995.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00995.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e25f719fe9ce2e40470f9f9eca520d92787e6ef --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_00995.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae8ac290adf98dfa9f5e3d2063435df599082864f0aca3f65b10288600a515f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01000.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01000.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..08c05fa9c8e9f0ab93dbe3c00def29e5f712d754 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01000.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a52916e93c983c7c1b0d277884857c647e631ba238eb339b2c83367283fe3ff +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01005.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01005.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1a3157ffaee09de69cd968d8d55d2bcb3eeef014 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01005.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b582e7332822ea259e04ce5a39e30ba46c27d1618f41ce5c70714912067801e1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01010.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01010.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e14b3d446d5b6a0c00b4aed40687efc5fdfdd048 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01010.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d65bdb6a45e734229f2298e056b2c14a09900073c836733df4adf4c5506b1d0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01015.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01015.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8ae4134a41f3328f36c9d83367cb86dd8bcff84 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01015.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fef145c21dcab070ea82b9c8cfbac7ac0f6be0162f4906e306df7426c5e1e42d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01020.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01020.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b2f3925f0faedab01e9560f991c00a90dff07452 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01020.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:532ff25d12f3a161a70461e8fd04e7c98c5208d3b421e9c0c42b87aea72e3a40 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01025.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01025.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4170d0b2f698efe4bf8e7186b0713a2062762549 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01025.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4654a170f7f62263b2c372a04fd32282e5401f2021d46c99bee0b7498ddc745f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01030.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01030.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c1a6a816af75482870446d9cbfdf044fbd47f8da --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01030.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c83b67b681bf5fc5bf5c09ffd9467c51b077fb4daed78a41d007e8635d280e24 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01035.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01035.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7dfc0a9fd44b46851a8255728d2a6b333ee5841c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01035.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59e3631ecdba14cba01bdf722ab3f0b088a7a4adb244e9b642b60f0bd097a33b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01040.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01040.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1ca7e9f275c358ad1528d0d988a0b6b132c3a0c3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01040.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79f6ad864deac0616a4ada94afa151c03914c9378fa90fab5ed4239cd0524108 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01045.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01045.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7e9b3077b7ae6c9f8ebb3811c4cf1ad98fdbf240 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01045.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c66527a56b779ea7ae9383fcdc4092566486ed4eccb57601f124c662112375f8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01050.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01050.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6dc330c8179bc08af925365c6463485299662991 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01050.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04120b445b37d206829b23f187f873c2e1ed25bd95b3361cccd3ff51185eac0c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01055.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01055.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..14a4914c21444bf19412a9575a413bec8cf16244 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01055.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b17dce3472545101286729d232f2627a58ec03220f6690bff32d0511134afa70 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01060.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01060.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..579c9bb14c382449505dc20e4e1d33c9fea6bbe5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01060.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37357c34a656a56eb9311f1781b878ca2442998b3d98115562f7a9c6e765c141 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01065.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01065.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e9ed8690aa7c240d9103bbdc2a396c83e8d76354 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01065.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74fed10538cc7197087f74b13621d5a1aa8d835660c38c0dcb50cea68eeabc78 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01070.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01070.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..92b6869cbd3a038b6b39c483be09b36ac8e5c05f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01070.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbe6d949b6925ea1ee529d12fe96f1e172903bc6f64bfa685835ee772a601fe1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01075.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01075.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..97b76ee6271ab6980033d05d279fad6ab03a2aa0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01075.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab2810d9bb76dcc3c3d397be672e9e2046b6eef09f24f908b970b143cf1a7bcb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01080.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01080.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d51ba7cd26bc916e62972b6a1705ba2d4f44f098 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01080.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59243999b59110f876ffa728ea4422b0a5801fe53bcd481f7aa085d47e116e4a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01085.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01085.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d9b1d399b59e5e56c420315353b45c42b09cbc5e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01085.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e1e67e5b18707ffb140149e1080213728f7166af6908b879219dfa029cf418b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01090.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01090.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c8d9dae1d4dfc8ea0a2582560ff34ab5bca9325 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01090.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc4d99af3fd71749e2aeb22bda99efcf7bb66459e96c37568fceca0ba0035722 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01095.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01095.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df3f241de381dcdd60f669a1720c26a09e12db59 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01095.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a5ceac1b291c18b87401c0c1290c2ae3170101ff471cab8e247b9da292a4936 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01100.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01100.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..02d8fd4eb8c355ec1a368614bd9395e291f949a1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01100.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10363fc0fa3339c1016aa6082bf491ffb8e7abe4f41bcf54056ed9e3540bf572 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01105.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01105.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..87f5a766a9c29f88265362d86c6e94a76ad2e33a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01105.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:821ffb442baba4d842346473a780cd984b9e9c0a53e467d38a459b04320efba0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01110.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01110.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8df97c68521215fafe034a42eba865137dd3ed16 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01110.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8d679995f0afccdd27804d72f2eddbff18e5aa9b0690e9e0c18ec53d8f612f7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01115.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01115.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d4116ae94aaa2ef929f4b3ac6162527869da707 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01115.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c412c3d5d1a0237340e032dc52a3b02afdc444aa9fa1b0c5fd21262926833a1a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01120.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01120.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a91d89be3adfac8c9e2ee87ad725845724cf0591 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01120.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5effc8d4e94db2aa9c62284c3d7501fbecd6bce86463cec574e9f1cd88f5d65b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01125.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01125.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c8daaa537d6a3865450951b00bb3ba7aab88f8da --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01125.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:789b8c89547ebdd2b11850519394c49a327dee2f4cd098fce77ee3e25f64c3a8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01130.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01130.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6103c2be0b68f608e646ab893b7c64f7a2598a5a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01130.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3a7bb7444f156fa3e67992c3438b9c3d2c101aa93b0fecb1d82a8b0d5051888 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01135.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01135.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad84580b8b47a8ef4640186992bdf3b3baaf81c6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01135.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d45e3fd324c0b187d581bd44a26087c63f0fd516055e40f550430e1f4fb36ce2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01140.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01140.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f32402d935f2a17325e5d14998d5133f9785ca3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01140.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a97b6623bac84a6701365206010e4fdc238612bf6c986ad21d369b2f8903702d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01145.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01145.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6cf79e4175a7e6bd77ba8e3d3f2b333a4f671027 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01145.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53535f558a3147ba4a82fdcae42b72e7a59a0931a543735676f0e0161fd00e62 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01150.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01150.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..62f4f9a4cad8429303a8b0e15f9d9aeaa6decb16 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01150.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46c869fc107db52b97674110b9321732aef5dda6d9876aaa82b405cb74875c55 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01155.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01155.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4930224a8ce204ea14882e66ff1779a26ca98b21 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01155.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232044bc7af349fa079ebf8f4bacf93b37d08dfd4aba3e7b62b78c7572746a1c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01160.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01160.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..116f3f8a1a97c109776e527ca45a922ceb152e52 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01160.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf5f8205183d937411d28c9508ff6c84fdabd000fe245cab9c04a92fe47bb1cd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01165.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01165.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d4e6fe16dbef88f9afa773dff7dc1a3b429c8c2c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01165.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:389d09ea11a086c4aa4354c90b83544b8c262b957525517734b9a1edec7b7293 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01170.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01170.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fc3189b51bde6fbe721c8d214ba01a30ff42fe53 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01170.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8776b4fea602db2fd093022f7ba376c499b107fa2279090e74604610f7585a82 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01175.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01175.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..41b4b34a272ee52ebe7d4a51050c614760c27c82 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01175.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf89994dac682981583a3c06ee02b4c1ee94dec541cd86f546fe511266d64e5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01180.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01180.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dd815825091d5e0d6b1061f2dc57f01deb5be0f9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01180.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be39557d5723af19714bf716272c5a6f2a0c4752fe362841949a388ed5d06a7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01185.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01185.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d900e5fce1c73cb5af14c5741941998130a51eb3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01185.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26bb3900ff387b39cebad3e18ac118d24d08325f8b180ba465274017454015ef +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01190.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01190.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b9bb95d3362d5ca8ff1b3c4b113ea8e410f84536 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01190.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e034bb63586214ee1156bcfba72636e475b70a010fd2f8055d89c4ef81d30d7a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01195.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01195.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c960ca78c2537381230df7ad8fb5c61d892f22ce --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01195.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d6fe9242ac54d9733a80450f96c54113cb67cbe863475a6b715ddb8728ab97d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01200.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01200.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..569768717002e072934c0fcfdd397c0b7fca3244 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01200.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef84f80c703137a20746999fb0a83427113a89c49ba26d2b2b04c165d53fb8d4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01205.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01205.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5a008cc375283e719d145e91e43bfa42bc12836e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01205.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949a9f67b8b67f5182c6d7c4b3e40f1e4e7358027153273ffd0ad7cd5bf27a92 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01210.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01210.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2718724d26652152524d48d52ad2e4538c2d6f8c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01210.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb837a86941a7f454c82ce6f3af415d81f7c9ba45e61b6de2e850ff46bccf608 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01215.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01215.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5d39bcc9fe2f09a450a8b4bababcdc28f0767b6e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01215.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dfde7f523b989a920b1d04480db2fd52fbb38540711e3d920db85398dbfb574 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01220.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01220.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..04396fd5565054b0c0dd30470dc787bd55883399 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01220.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b20853e27c6117965fc7815280e9b1ab820d03bd2c43a06161602294067eceb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01225.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01225.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6ac9d2ee4e2aa1574198dcc358090e8fa308cf12 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01225.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a44aed3bcd437b1aef634799a6afeec6ae69e5d87f95d26e0d758fa969325513 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01230.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01230.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..643fd014ea84087d4f2a554c9438aaa75aad5b41 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01230.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14867de3a3274e492d388a82ca54dee9a4d361ade12f8a387a233d2bd6b2d3c2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01235.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01235.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..49ea32eff4143829bb48dc70625d1fa55e7efa0a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01235.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b26f6ccc36eaeeed34808deb6b3de97af01943f1d1aa2be1e79a234a32c9ace +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01240.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01240.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03a420ff491f66b1afe46d4ea40781558884cd12 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01240.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7413b554bd9ba6340270f820d7e1e9824304b5e0db1807cb08f9827d8977b4b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01245.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01245.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53924e8b1e5aa5ec1fb30928309ab9e74f31a8d6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01245.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef1e977e52984ac996a1b0f437599756f2b268ad7ed340c52a0f4b1ab08d9fa +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01250.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01250.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f50ae8687d52a651823aaedfad540859f74ad126 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01250.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:398b8af1ee1b7d4b44afba5fd8d35b90fe048a276d5ea257f2ff2d02858a4e5d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01255.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01255.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..79147db497536e26afa963a59bc0040ec02e13c0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01255.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba361fcff7919f748e9ad3412c05f085a7fe44109f6c890c9cca069812c95640 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01260.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01260.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..14b3d1c62e9e3cd2d854f22447ff6b6213a2d561 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01260.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70a0d2a21949a0adab5bff0674fc3dc671006454d51ecae2a3dad7a798bc488f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01265.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01265.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4914a1f7afa868c89705ef719baeed642be74087 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01265.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39ff78bbf6a29df990d42258459d661136f342345f934624b34bc7b96a863046 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01270.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01270.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e94d05177e01e28dabcc27f4583c92b4afb829a9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01270.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6cae731ff8b8b31c3b96e59849df5f351a6780c2d146169f0ce893f098ba6dd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01275.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01275.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e97307d8f2b32206abf2689f2d50a7178827e047 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01275.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1a60b3ad9efe202d5b67fa3412c78e7c840c53e66a8c1881cd73618f3fe8282 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01280.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01280.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b70c53ea905d679353c45742e0a19b54e00019c6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01280.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83dc68c4e9f7ff92ff626cb90fd775e64541819d59c3b22388c9a8d66a0cf9bc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01285.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01285.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fc7c800273093e2a299d8162c8413a17f74de094 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01285.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0c619d0393411deb80fac46cc4a5c582e6db4c110edd589d9c1ccf0317ea1c9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01290.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01290.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..789c46949c3369d978b76461b4dc95d620f1251a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01290.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:135d8ca7350f8fc7cc8bd4b67b4cadf79e9df45b4135833f00882ef230d8b3f0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01295.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01295.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..061018c96f582787261db4d09159395bff65458e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01295.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d41a66d3a49aea3ce79b3608c5f04d72182e90457d0a73c1cce0001dec7d92df +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01300.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01300.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e623386111760c61d91f5df6b1d2965e84e7e9b9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01300.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfca0360acd48b230cc4d35a02bdd1ed71bf7cd19822f9e571fe3326d885a73a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01305.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01305.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fb2188c0fbcfb6fac39c95d7a0a50f2b3701ea85 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01305.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b0790330b769951736e652f399985e6a8996c571dc4fd5b1b1bec29d15649b9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01310.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01310.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..edbf6a8cac492646f1cb1539f72a825b035dd044 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01310.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8377d28d8cbdb934c1af791dfe5c71d64195f5e448fab245e0366fe2dbb2c2e8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01315.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01315.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..beb342211f093aa02f5304377c00aa371b390287 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01315.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c539439e40fca193c15a98eef2b5c839f37729977924c0ec16ddd5a89d2fbc2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01320.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01320.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..46ea6e0577abc1e1c1b27d8a1cdc33de34b6f46c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01320.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42ea973690e878e26ea6407db5711ceceb61c29fbeb2156b4d05517d943a6e65 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01325.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01325.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ac56f06ee050b24cc3709eb8c252ff6b9a06357 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01325.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c437bec724fa723f1e57c8c6046ce7566cf9c9b0268f4a0a318cbedb54a2a296 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01330.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01330.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..053bcb5d79bc6ab164504afe6cb7f1f8ea63d888 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01330.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5738491bfb09ff24bdb5a6de4dd6d311dec2bc217fccbd2a5cf2b3e511fd82b9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01335.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01335.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8b6e2f418a32ecbaacb4375dcf93503d3b19a1c9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01335.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0fb0625de8a65d3845cd3a81387422de9287874a5964f3c807ca3d385098c7a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01340.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01340.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03d932397dab7d6113a0c76aa1b5f41f8a8d0de4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01340.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94fbe01a9f412b2c7e6d4ce06cfaa6a6ccdab1641bd8898dae64001f7b2f3152 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01345.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01345.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d800cac49d145a51af00c3384175c4416a077a59 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01345.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a79465ca28a31cf0a290f440d9040cae212e8f44ee45cdf9828c4d0a686c776 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01350.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01350.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2f571f196ef8f01f9c298251bdcad8c4a2f5069 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01350.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7d84a7d40c48db1fbc9fd1e0c364771fa44725003109a2dc5a15c9ed8223748 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01355.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01355.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d10d95f591a76d295920de9527a3f3cedfe1e161 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01355.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb9552a407813f2785a7cd2422b3672594b33f48da7b7faf34c9935746d7239 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01360.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01360.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..85feb117ca7c4e7ab0d9a69cb5893113c05050f7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01360.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa164c8059018a51f96a3ad95c52748e07e92c6938aad703d3f1fb4f6a730b7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01365.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01365.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ac6fb2212b80031a37537dc42ae5fee6c7d4b2be --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01365.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c7a215f6580be7d0af05e9dec0cf774cce1440a4b36e5feed0c67f893ad75c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01370.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01370.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4927ec3115f10f0a4c3528a0e74cae5e8eb1a9da --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01370.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c874ef9f95ac7967951609791fe7e49008590d3cf0f34e2434c93ada701c9c0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01375.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01375.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ce765bfbc5123736c54beee17ab3ce53b015e4cf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01375.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96b2a09b90aa05d6b7fdbee9bea9ffebd6cd283662a17fa55388273bc008ebeb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01380.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01380.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..da180e8dfca9c94004d989ddfc0e175a260fbc9c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01380.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:789401e2ec0007e8f406d38a2bfbe5a8336b9087b14f27aafe4cffb5d8144695 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01385.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01385.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..796576e334981c8a8e44f5d60b3ad0dfd8c2bfe4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01385.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2f369b7f960348176505541b6afb96b299b033da4985542a900f95f36209063 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01390.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01390.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..688d135e7e3e4b5f9d44e1bd1152ab764110347b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01390.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:215fb3589eb60489ed26629b96802824576ba182c68a8f237e19b7cf6502dfcc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01395.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01395.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2877d507d55f08fc86a52d0a4f8209bc35f35563 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01395.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eca15552e3de4a2c480bb0b349016b032bc8c21d5c285576df78a9eb69862fd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01400.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01400.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8c5db5dd5c014e0eb19643dbc19dc3c89747689b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01400.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ab62b094cd4fc393028f7406115bf4ce0ff238545ce25df59a8dcbaf60c3b08 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01405.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01405.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9d0936f9f34b4a6d531004d9744673f01682d008 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01405.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:857d34a0cba90a9858927c48291996f73f134fc1956a17c5b81d1f4739a34ca2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01410.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01410.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d9b1fdb4a37f889dc9f471733f9364266c643777 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01410.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a8156fc8730ad5b7ae3551ac3930a04529e3f8cfc5bd098f3f9c2b1f2b83a9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01415.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01415.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e7c607022cc9230ec685af64531c320db076299 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01415.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c1cdb4816decd204daf63abe427dac3e4b6cb8970755d9b4e2371c0e12e505 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01420.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01420.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..604298f752e14fea879fc096c596c18209da4a76 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01420.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1e4e85fe8977a83293f0a2a7123b263659c35fa7844cd3c31d644ed209b7abe +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01425.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01425.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..237b6acfc70c78786637032ba9ff2f8fe3dfaf22 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01425.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:264eae773a5747174587497d6dd7998e89dbae1758813ff6b8d31428b0da8f1e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01430.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01430.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..46fc62b2a5407c89556ffba590399fbcba8ce751 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01430.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6bf9bcf375a9826593ddbdfde66b6986f9bd4d1cf3fa3461d35df40d8cd3481 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01435.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01435.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..70cf44e904558d7c54606f5346a4e87c3c1aafc1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01435.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cbddff2a202782a25f9977590662ae45c4d195e5fd7a1a74a5ccae05c5bbb43 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01440.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01440.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c06c2a104299baaf5bc567f2a43cc301b2f193a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01440.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:047ea26ffc850a15f0c779d44bcae8b2ac4ddf95cfc26e26235e2a70ff34f0a0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01445.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01445.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c41075215f6fdd0c04f9194364e1d28a5b9d068 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01445.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823ff5c2c139f959d565913a1deb4b45e4b5bcd621a76c0e3e3acc80236d2e4b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01450.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01450.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..865d14cc04505f247631c3e3d0fa6202c2ece32e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01450.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c575f27471a4fdaa09b53da92ef1f185e9e1dc424b0b1466ad578d611b077f8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01455.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01455.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a110143daedb8587a0ee8c6743b8a06c16bb48ad --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01455.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:702aa8a9c26595c14978389be94e8891a715780f61fcb1c5deb132ff8e4b6c64 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01460.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01460.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..338e4376e9d9111ac385e3d97507759d9db23610 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01460.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a01b004dbe12ee8bf33c0125c896855d55a26564b36397e01c2f8010391c5a18 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01465.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01465.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e60d2cdc75d2d1a5cd2aaff6beb18859bddfbe1c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01465.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4629011f7536619f91a24901bc5c6ed6ac5b1d0c51bbe04fecd29c442dee7c9f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01470.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01470.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ffbd3940f602f7b268ce7707be037b512fa04d7b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01470.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1402e51b82c00a8385ebfba7e963533feac9d10bed843f5f2ecce95e07d8b18 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01475.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01475.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7409bb765b2b0ab573cbde255b61252a27ea8304 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01475.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22cdf1f864323a313ccb5465717b558ecd93ccc5d1ac80fc009aa80f152e8ffc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01480.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01480.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8638058859ced7ca062199844284f931bf22ddf6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01480.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:123a2fb36a21d3c59c3b7242844860fd59505ca873b425c21c03a8ad2f752f20 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01485.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01485.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..51b76018c96d21a48240248aabbdd5be3133b3ef --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01485.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d55162e5245c1ed47ff051514d6f757876861a116be1a4f6789eb91ff53c7152 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01490.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01490.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bc67e8f5c2d259c4dab61141221e1cabc79ac6eb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01490.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d82e91c34d4fe0804e64f18abe917fd4aafdbb9d9c7253809fd27e8bed576f16 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01495.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01495.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d7e25650cfce355f6096db3487d2cd5dc067bbb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01495.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0691a0043fcab24892b58c79ab86617f541d367b372f3501bfdb3340528d272 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01500.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01500.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9891c2426ebb89b7839438abec179d23d5dbc93 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01500.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:293e783b910cc58c513421f5a7e1aeb88219981dd418868b8a8c78dfea4402c6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01505.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01505.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5feb1097b839c64916e5e49ac162f5b8aba9d170 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01505.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bb2dc529ade3debf6f6a60a016ff7d795ccaa901ee7f4e072241e80adc912d4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01510.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01510.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8a91c399decde813c715f40e684b9476ba3f0d0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01510.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1144f9ca9c0eaaf030c74c7a452c610bec31d740f5f4755df32f89a664239a71 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01515.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01515.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ea168b575bd62153450cf883cc46ad45306f3e5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01515.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d3eb0caac314dfef708a85f1d02c105de08655dcc463706e937c6a040526d0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01520.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01520.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a7b3f9c1e92c56a6fd40bda48e6af6dd41033512 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01520.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042749ad1e30098342026803dad85f38b6f50f2cbf68d2f3393b59546c1c2a23 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01525.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01525.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..31f63b46f398fde31080a1006523460b425ccd25 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01525.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e04ceab7914238c5269bd3de5ad4b4ee16b696a7d93b9d95fe6d525622e6c21c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01530.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01530.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c46d78e30586b4c189060754b7fdf07afd2a72e5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01530.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:901be125eb2a717921cd106b3ee7049190338f87744d8c28cf30611d62331f09 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01535.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01535.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f5789f24597739790a5e64c571836404e9ff76e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01535.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654eae974ebbf6c32525bb01a2747185b7e2d605c61159df75368f92ace6eb0d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01540.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01540.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eff253d2d60f7bde2dbec86564d4c2ecb98c18a3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01540.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9bed15f491416b4a4d48c3619057422668aeeb8c278f7b270aa3c07af845353 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01545.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01545.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6537df9a8faa79b6a41db49c7af74af4c5e37e5b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01545.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:289f26798881477e4789a098d0a563233ac590f53d9f945adc875c632aaf280e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01550.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01550.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1dcbb4c46fd6902ff511d491d99ec3b94eb4e3a8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01550.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7b9365b889f95982c1a7c813d19a245eb7c7262518a6e137893ec2a11fab88e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01555.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01555.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..318c4e036a95043bca794c4d290d63c06f59df6b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01555.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20636ed6eeba6a041f9bb616913eaf64a9c6f0ca3858f3f5876fa9689c39e239 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01560.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01560.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d4483e3bd044deccc07a8df1283d46c597d9d31 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01560.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0936504647903baa1adc27aab439682bfb183058251fedb9f04600448c2f4879 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01565.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01565.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b1bcb95bd5f5fdf7faabf55c387d8db799534b10 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01565.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adef689728e66eac0f302ef6f09fab0cc4e27a9e7f1ba96817900d43a32963ad +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01570.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01570.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..945353017506ca0d13b05a79c19525371f17c57e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01570.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f70bc0a3686346ff44b2feecefe4c7804f67f6da13eb05d753e87e9015bbfba2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01575.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01575.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..80797423516999a6a3a636e8819d15035b2502fb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01575.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1678f77e878867dbd54acce4cd5ffbc87c5b7513cf150b819dd0f18f9a7409a1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01580.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01580.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e202fa49de9ebea4159957164913756c87e86834 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01580.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:132de3ee2c9fdc8ea8df90d34d5d19c51dcaf527430bb71c3118ff7f4050bbec +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01585.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01585.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..78d396ad3dbc7774166c49b0a9ba698b0dc8e84e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01585.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b01ad1a67360917fb1ab34aec3148739321a2e08c5a97a27ca1b78f4796d943 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01590.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01590.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0eff0c6ee6e50eacff2af50c6243e9ca63ac67e4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01590.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc51c46c4c0a2d221dca640c95c862decdd5e8bf14267663515f5637d3eab6ed +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01595.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01595.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f17b7e3b6f4a15fcd794cd2d23f8ca68dbcc3db3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01595.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53336933901dfae7c73328879d5c3910a91305da26e5c9ec67a317b526849cbf +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01600.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01600.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5420dc8a0dabb37ad66aedc32c8389667a8943f8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01600.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:915c84b733999738557a3af29036137ab7709206e1f1aa6c5c3ff711b290ff9a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01605.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01605.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..71ba398c3b98e9c7caa10d4a2cec524fe3714a3d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01605.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7de967a96751eae7db4fe8cb6d0195ec2fdb02463a8d266ec461e56e55f140a0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01610.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01610.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aba9410a1e4ff937efcb54bf0f3e28e355390045 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01610.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12c797516a41e7fda751f84fecab2f81bcfa24d8ebb771da57027e1ff43428aa +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01615.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01615.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..239c77cc032b4f80a04aa3020ce6c8e380659b19 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01615.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68c8f7bf421610e190e4e3682dfc349702c64d22705683eb2249af14cdb3d66e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01620.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01620.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f19dcfabce943cf6991ddaccc4ed7727e5a70531 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01620.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34cd27afd57e8abe5ccac0064b8eb8c8b362b3d3610171d381d134be17c631f8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01625.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01625.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2fa3904e4a1aa4695b8ab85ece62415628a383f4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01625.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f7bc5aeb975ccd0a3d5967d95892d60a7b218ecfc04cdb462d16774917ba23 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01630.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01630.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7796377eb44bd63f0b99a154376320be2576702e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01630.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b6d25fc7e020f936b290b803eb8d5e953174153e0f83efbee02aa9514d0e4a6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01635.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01635.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..515e482934a35b9db318e1cf97781168c4d937de --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01635.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7daeeee7c133bee146b22ef71be7dd30761fb3a3ce74dcd4ab3d4518a05c41a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01640.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01640.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..964d47e425001b6d4623b01bf89a18c0b88e5f25 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01640.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af1bc6bd181da39915313ceecd06350f5606566426e3a69e411af5272b5fdb87 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01645.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01645.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..888938d3e2326720a59d233f6246872ec752eee4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01645.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ca971a2e9246434d6bfe6919ea4be1f1af175b33d24caac296333dd0d3b4fe2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01650.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01650.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3e33954ebcaa64ff135c6e9ed613ceb9c0199502 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01650.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc7bd418f71756c8908a9df3a72a08b0522654cfb1d0f3cc7d9faad3e100c9da +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01655.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01655.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3567e6505a13b4455f4825f56698eaa9624a82cd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01655.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d71e8a07f8b719347df5f9c719365dc8f8dae8d1addf6d00c2bafe8283e8e77 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01660.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01660.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fb2c98713792ead85b59b17232cbc51911788c2b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01660.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ad354a4dfa6519f9f4277c7fa9a8e00c2df7c9dd93aaef125da5eef847da34 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01665.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01665.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..76eb484714ecb5bf85264015d6ad675bea4ba94c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01665.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e5d2ecd4917b6a100f716614b5406a818871aff857de0d56c0630ea7e839709 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01670.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01670.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ddfeaccc67578f220d79bcc66953140ae1e457b3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01670.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5dbdb98310c4f487de80091eeb61869f8996adade155e31ae4cea8b9d973659 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01675.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01675.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f0a73ae057e8a8b6cdd794a8b12fde132e7da76 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01675.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c931dcf1c640f00a0d1d25bac45ffd30fc11cb4af8632f44e6042783e4cfb6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01680.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01680.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..003f85be0e5de74be360e6fb7104ad570f04305f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01680.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a81a67f3a3a324d11cc7005b451ec491893f18d315710c04b74e7e200b75c6ab +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01685.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01685.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cdb5d14d48fee70a76af4df2bd91d261fd89a300 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01685.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f323765dcea82ed327da928f337647e657452e5a0539e8c71d2c936b0f66c3d4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01690.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01690.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..268dd23194ab2b2f952b56fc6801b7ade59f8f3e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01690.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ceba9ea8d9d534757fcdf9e3bafa7966b06f8832ad123c989fc848a9a592c9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01695.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01695.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3abb82d311a89e678aaff98de3cf6d23b0149bd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01695.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:009e5888cb5d47e8527b950d9b1ab5d6be669db64b6d35c7372b54d547ac2185 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01700.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01700.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dac4623f32f7f9028a5a13ae5de9b775c44000c6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01700.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a0ccd3b4927615f4264792b702134d3f224988b994863d34b638d84b8704c10 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01705.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01705.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f2f1e271ab4d31bdcf771730b41e59f7dd911688 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01705.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d41eb0207976e5f28f82418c2cd197660dfe83cef1f26c6a18feb4f93fe8faa +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01710.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01710.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b693784af4c361cc64faea4c055f40bc2d73642a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01710.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce8d0a3ad86b57349fe6439120a8272f26add570cc84f0476dd569ab660a49e3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01715.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01715.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a14df83a0ccc14b5facbabfcab23b837d9ef682a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01715.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dacb7adbadc7d93e93c86de568b1401e4fb876839b614396828ad9be3378d8a1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01720.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01720.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..308a2d6c608852824bce2049e758f2aa53acbb4d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01720.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0ecdc7cd32cc7a5d8e8e9e16d2089c802771957494a22166b9951cc47d104fe +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01725.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01725.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ac35184b64aec49d96f83653784feefdffc9eec --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01725.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f58a644bd6d4f97f5eca69f41737adba43ae24f3790b9a239c1b60f6565e6b3d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01730.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01730.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e6d32620dde9f3caeccc4a038f51bbb3c4f94322 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01730.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bb985b7af1b0e73f2ce984d07d0ec54ff7e6f00494f47bb7bc0e93a6f2307da +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01735.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01735.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1a0f2217d66ecd671869074bb102d1da2805aa8d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01735.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079268e9447c72787c1430dc990c489b8ba023860598c377585af07adeb34898 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01740.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01740.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5a526bcf98db20e4f947baa5b1fe2a948f3b9f3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01740.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d5a24daed2da9fc5c84f3e8ae3a2834e5605d687de2043c14a5552ad7505e0e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01745.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01745.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f60ba1279aec398a1e252d77b8925cfb2e0b5cc3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01745.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9127ebb034c736946cc32dfc559a05acfa1fbce6f3ec9fba569093601ab97968 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01750.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01750.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1107d95c495ab11cc32405187726a3b7ec1c1938 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01750.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2157a49cbe7361fc360dbdc72073af9f35ec384db4d9a98a6ed1e04bf3e5cf34 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01755.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01755.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3e57ec84050649eaa6d38039a09b66a9d36dbf6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01755.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83af2d4393431f3c47eb44a142485262d39ee507263d0e943c046704e6427405 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01760.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01760.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..baa29a7d443169f4408f514878048f74a8385b1d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01760.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f3ddeaf21a14814ba270df9ff471ad747c7f0b86969a06259b369a1a8131dcb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01765.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01765.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a5b2309498c7b2d5468f33f0367b869672d5041a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01765.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d09cf1dce078ab507dbb0c0debd947b354aa473763ba89adb7eeefd94c0e25d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01770.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01770.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3aeb921f4d7b3707ab5834798ffb67e2057e788f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01770.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3502f1303313a9155b6dd10163693c2232ce8c5f0853557196b258cb2a555b4c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01775.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01775.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..836b6ba5e34c536abd4df43acce55766fc202dd3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01775.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a7c6d11b2dcfefc98de14fc311e191fc77690b78f0281783974ee19f91fd531 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01780.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01780.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..def511d5988bd83e2978366fc442b9318937a344 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01780.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8adcefe43704a3d48385e4794ff9d36f0b45b825a06cd934bd4e369fe02185f4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01785.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01785.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5609889ebb8f05301b9093ee8915b64d52665ad0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01785.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d17e36a59f5bd318dece2940627f06592d4c3a22da4ae64eca5687aeaa28dec +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01790.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01790.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a7e7e25bdc52dfd99b5af9074e07a7a33225fac --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01790.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ff275cf24e0c993709e0d75362a375478c904f39ab2fb58e746954fe72f60c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01795.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01795.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bcaa90d32bd2634116cfd2067cfba040dd01624e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01795.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b191de87409439cd19814d3fd7e75eba904e3fc53aed42dc399ab2b3cefd93f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01800.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01800.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37139ff2974e30fbb1015d2591ec91ff593e965a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01800.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ab1ff545b9e25db7164b2cf2f6faaaaeda6c236cada99e4d3a697e726e2446 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01805.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01805.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4964e2238c97f3ada34ad2749ee8ea39df9a181 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01805.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2fbce565be325005dcb21ca5371fbc04b8e6821172cf6c54fe3346182d19cc5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01810.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01810.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4144deaf090222c0a2154f5dd25ba089d79611c6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01810.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b3b610fc2569a37c95deccf3c1103ddd3fe73d3ebe0e3eca99a5f24f3e26bf +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01815.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01815.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4480e5927d929e5f01c60dd88277e483b2ca2cdf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01815.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cb07d22619e9c8cf4c0268b9c25508663bea133359bca7de20dcebae9dcd4b0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01820.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01820.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..06424df84c893456c2642d5c13f0b9f95f4dcbc7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01820.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169935bb30749e0b8388958e0023405964bb6b81f663ed3cd746a6140789b43a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01825.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01825.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a654e945421840d3ec4ce3e7143ad21a952c3bf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01825.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:770e1bdb9f4d6c4fd000e936f6802250022e3c315e88eee1f59d612d32d6e894 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01830.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01830.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ebc19865645937b2b81e1829e04cf385c96aec5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01830.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c947935f9339eb0549faa345bfc484d4fc44a76faaf7c2ee1f29f1783ae808fc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01835.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01835.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..35b630947db0a900650e13c17efe095f09618d7e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01835.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cccf0b02ea3511a974afaf7f763a65716be6c698087c0da52721670cd9ff7d25 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01840.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01840.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3267f407bedac09efc959deb1321211930860c28 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01840.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e08e110fba674ae242c412a33fa08ca1b7099ce7f8ad188f6342b65f24682ee6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01845.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01845.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f6054b7044035161c3046203c14e31a2cca25c6e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01845.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:818fd47e938335d91f1177bc414b1b11adee2a1c7695c2d80e52d012a07c285b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01850.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01850.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..167318e0c03ac9f1953c4dab64e945fd11eace83 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01850.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37930ce9a011710d3efb6c7c38363c8378bfe1dd281766960194b47d6488ae06 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01855.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01855.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2642cf553c2f613af72375e81ab773b47cfc4b00 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01855.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486e9a0fa253bebe1656848aa60c7bd50f93ee56a60b517989e1adfe67392dff +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01860.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01860.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6327aa7bbd544c1e645b03c682ff208aa2fee2dc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01860.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b066fc246273e467e54ee9f3e817455795300433ac16feb1f134bc2453811769 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01865.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01865.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4b80bea798d5275845544cc347d36ad90ba0b391 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01865.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc2d9d7ea3e049d453d8b90f325a18cd96774f38ddcf9983f48af26a73a47b7e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01870.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01870.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..43f90e6913ff1b822f70666d12cbc94cc30d8d75 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01870.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b585e060b306fc52dedb6c942f953f8264f7cdbd8add7954070ee95415472b7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01875.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01875.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2e149057798fcc02e70c2a06d35d6791adb61e0f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01875.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bb1aa889c2523d94f75f5eeb321f0c7d4f824e2c59d9347e028d655c160d808 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01880.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01880.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e23e4398d206ba2915b9b9ced5f6baf0098a74a9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01880.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0714a572f19d76aad75255253fe1eeb9b63b7b94eee50c2d0a76b347ab54ced7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01885.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01885.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4e4c11c137feddbf113e168189e867f6783cc3cc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01885.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0780c400f84b9751462d177ee6a5bc4c81518e264d14929e1d11d5a4889695e3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01890.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01890.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..140732721626f13069132b4400d10ca75ead99c9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01890.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02e5501a05b46019f21a36c03431b08086d0bf73cd5421f28ea92cf71931f3a7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01895.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01895.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..28d25195bd6a276e96c3e1b82ad35699a57b8950 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01895.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0d3fdd449706efae596262e3424993bbcc41953df42b99f8cbb1728e53bdd1a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01900.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01900.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4110adea0c217524e249630d938c5ae8076bc5e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01900.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8adcf549523b74cd69770daec5f9f97a118ded500d6dc8c7300d2c0faa87da4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01905.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01905.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fa9f0c95cf415f4ae9d6350d6ac687ca04ba170b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01905.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c26e687c40f4d37cb25501d2927fe05233b8e2426b7370bf7ad04e32041ea5f3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01910.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01910.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37481bc665cd520f22bdfc743455601215eab675 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01910.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb6ad6b62eef1588f482f4ce60d0118d5cc14599880c303b199eaf9ffc8610a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01915.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01915.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4063f7f59682b7cd4fe5cdd4a1fac539c3eb9ae8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01915.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a6df4d1df27f23a51adf0b02142cd4e5de88d0c3edd59ef91cc71202098c1c5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01920.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01920.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ea220e571138f6c015dc7417905ab62374653a80 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01920.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb0a62c49010609861f060a5af7cf772c1c00c1dfb3540df57899e5b77e06455 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01925.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01925.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc968072e90d142e97c1b7262025c5bfe6c1bd4b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01925.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12beb39dd617412f9f539fee64cba42bf2fefd8c6e94aca787688144261951c5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01930.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01930.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e844fc6adadcca3932c72fa16153421706b18ef6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01930.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c9e0e3a160441702b4c9129d05db70e0a4640208cfe5ac8d806b9ef34724d46 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01935.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01935.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dff0650dd1c4bbf7e27ec439b702ffcf32c995d8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01935.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b3231e150a72045acfee15dc9a9eefe356dd72cc0bf774036f53eed6537b75 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01940.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01940.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..62d78ebdfecfe51e3c4cae247211c7251c00d78e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01940.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:468dd039b6a3143e380dff370c32f32b1a60d9cfced1c0368cd1ccc30e2413aa +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01945.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01945.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..50bd32721d23fb32d5ea4bc23f621922667b1d17 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01945.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:549aa66cec94be9763fdde2f3e89dedf4d18cea1308d709d77563960dddf08ad +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01950.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01950.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5a73784c0b691285bb8e4128324e05716c35ce97 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01950.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2060a3da5778e0ef22e8b9aa4abe56ddabff6ff25da4957dde7265527e86cb5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01955.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01955.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1779a0030f6c46a477f75de1aed858b0be77e9d9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01955.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53f33057b3a559b65deb6bfc38b0fb5742549eadc3f98143535570e711389e5e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01960.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01960.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c144df52875aaba03df4902efe8507099613458e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01960.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e76bd8ff5d6f6df74c63fa735bd37cbb3dfbd52ef0559b1c14645587bbe68e3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01965.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01965.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..afd6f2c5f56955a93b72b51692be2900b464c653 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01965.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cb2a03d86754fc8173451c3f32ec96e30e67d403371a5afa41f90ac520c2b0f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01970.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01970.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..acc1778c9a5f443404c2a7d1f2ed42559a3162a7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01970.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60e413bfffb3769cb7785f69eefe2b9796e1fde61238105330c1158a93db7b85 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01975.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01975.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..56d78ff2c6bea61ebba63d3666f884e397fec4f1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01975.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d828ee4b239f87f60cab8a8784f7cc1ba9c631bc624ac3188d3b33c4b9723d7d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01980.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01980.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..30a825536f0061d43a80b791d0fd14608727b497 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01980.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32793accbd0e776cea628da7b0574d70e34e62d0e445238ccf24d0f651382af4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01985.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01985.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df16fe19eeb6e1f5d977fd5c7ce4cf46ab4be6b4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01985.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ac493ab3c20aef4387a60c9f835c9a2105d2d5843871940784b7b04ef0e8fd1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01990.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01990.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6641692eaf5e0714b1d93cc7e9d117ee0f61f1c7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01990.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e72be31d0a19781fc526fb8bccf3587831f2b203f13e26272dd80c470c3519f8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01995.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01995.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..51f42c3e5b5acc871122fb7b6080a27e7f504ded --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_01995.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a805441fb8c7e68ce2d4fa7a30aecdabdd7320af55900d2922ab66f312191d5a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02000.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02000.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b425c48355d0b8d30a0e29ea7f28d8bdf8a58669 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02000.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c3af492093410de188440761f7c64205a0ed1c730486dd80960ade9aee5a3f4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02010.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02010.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7798dfe0c1fcb6f9369eebb82a4096c4709101b3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02010.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76fac4bf85aa1a063f6933d148ecb0e9535853eec0dbbb743767a265932cb0f6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02020.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02020.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..75760dba0b17075c6719e4027eb364ba219af0e1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02020.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ffe455b8757715fa6d7b0abbf1bd10421375564f5de84a56165dc87180703a1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02030.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02030.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..72cb754abb4c111893d79edd7e1da1ba6e7f8f4d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02030.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:555cd899e90dd3d4b57f339e369a94135877d9d940fb13148a1896ffc1e6118d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02040.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02040.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f3c7d72cd0a510a844b65f12c87bbb9b44d448f7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02040.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf0d957739f7155c58a8047c178cc721423b88568bdc02a48f6716b602b00cee +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02050.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02050.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ccc50bdebf37ffd0113b707256405e10b12d9d53 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02050.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a9fcfd4c463bebfa949057bbb612f41652006d7776f042a09479b4d487c7910 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02060.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02060.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dd737f055ec19beece79f09d157c72716a45c48f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02060.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820bcb2515c017a31ee0907b639640c6f451d5e70001a72c8684fde0f06bf971 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02070.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02070.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..60bfca3ccc83a09f1c77bbbf6947c34619374fcd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02070.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93bd25aa710d4f0d0b368f18e263df3391957067b82188d878fe5321d13239cd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02080.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02080.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..02b06284899ee0fbad237fe52feb44e315ca5f1c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02080.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a8e301873bc720b024214d722f6b2d651f6f4480ce3149233e13aca0b6f3584 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02090.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02090.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9cfde5b5a4b2bb56cd44ac3f929e431d2f1c12cb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02090.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7974f4f2d6afe09b7cbc8a19ab18b419bf205a2a3ab532b85082106f7a400a1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02100.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02100.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7733d28850fd17f9c4d90150553b5e64e410bc99 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02100.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41da44ce271a804e751a922e3c1aba8a775f5638b43a7bcfbd5b8b7a653d5e2e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02110.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02110.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1978a9bde9c3075ee7ec32f6bfde7e7ed0687abc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02110.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:251943acf24897f19ec34292a5b0d8e1754e01ae94499e7c84879ee7b023d9f4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02120.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02120.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..74c5bbf83f8a876374fdb9e96a231b9a21604b2a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02120.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea38f898bcc2115f2d29d7dcfb119cb4e4279d6b92eb52761c65063991eadc9b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02130.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02130.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2e2e1f754fc02e6023179353301a7611d9ce3e65 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02130.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46b9dd0d19793b88256e098a3ca441a6fceec9f6db3db2baa405b2f78eff1cea +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02140.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02140.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a052e8c287ef8c8c390fdd2b6934e0df6521497b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02140.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8570c22119251b9ef5790e348a1771ea3768af76a91b0580f9b2b5f0f196b656 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02150.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02150.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1346670e989fb034e5757228d03f2384b2141acf --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02150.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb4a2bc32a5c83ce435a06c011d6c326f078888086b714874d05fbd4dd0b6b09 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02160.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02160.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0702b1449daf69d4ba05b6bb11a0c2cd08f58181 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02160.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc99aa4ff2a9b3b9c3397b970ef5ed059d5bb4f96d4c738a44294925f9c280c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02170.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02170.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2e7e775d843103ac0e05bd74f16ccc91d407030e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02170.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c1591f63c0d1967dea978a7803e28e7ecca60112035bc5f80a346cd2374410 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02180.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02180.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a476f4eceadc3d2afb61eac5325c888888b3a0cb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02180.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c90382db55c188f2b36dccab400cdad15949d279162e65fdc89039db8e6aa3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02190.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02190.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ae83d42ab8ef3c8c53da54296ce4f816844aa7a0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02190.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:273efd07b0cd4fae4bf29a07778c235c3d1069d442403e192e621051a13bc652 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02200.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02200.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be51c3f6ec75e4fb62229f5bb6cf609477761eaa --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02200.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36312471197f453ffa313e8e2739db9a4c97a37d3083fcae0a3b37c1bbeca5fb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02210.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02210.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..42eefb74fd336ad5d5351dd406251deacd752fa1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02210.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83ec3f127605b823b926be1ddc9b298bcd7b3e6a9ab5f52a23d322d7bc8c3e1b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02220.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02220.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..296749e9da791a949cc6a915a704282c7a949f87 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02220.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:483b9e90205646e15e5ab529369b38695f955303a92dab2fe718212b9dcb8a3a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02230.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02230.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9befaab009bb570da8a6ea4aa4f7ea24a44e1a75 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02230.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dae5603a8e1555dcc67b0bcc546d213b4c36089e34885630193dcecec797e67a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02240.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02240.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9732f083af414c76a570def7daae1af95ffb98d5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02240.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb6b43a4edf0ce518ab36ca46dc6de14849f789e2d68ce81cb029af6b6f23a2a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02250.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02250.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ba3e9212db85ce566ba6a6ba46b190d357756513 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02250.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76ece6ad17f1a9d538614f17d706adf647d98bb76da859c1f62a910d66949ec4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02260.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02260.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..46e9e328243a69300634885c1b63cc3e4dfddabb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02260.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f895f0bcfc6d858e82d3e63a857ac07d703adab8d51443d440e5dac0d6f5c16d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02270.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02270.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94fbf9a16eff0255c32b58ddd13a73d49fa4a706 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02270.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701a78bc43799a21f92cab87e7b312bb2f53792028d77ea6588339cf158c7f15 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02280.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02280.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..30b022cae934b58882e80cd38849126a7df5c51b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02280.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5285efcf147a310d6a16127b357467a06cf72a84ea95b1387331cfda28b953e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02290.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02290.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d1a6a11e5697f09a45fa2c6b533f0c72337f79fa --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02290.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0846941a81c046d6a3e2570ce51bfea2ded6c3e8d5fd33fe1a92d5637d13371e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02300.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02300.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..07fd00ce3e90cb0efb6a7837d22e7ee06a839bd8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02300.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56bc041ef4a231a324e4ed9be89e578e15af626ab3e5a077c3a299dc377eb2cd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02310.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02310.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5ce387afa7703fd104503f0e0f385e0ecf5805d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02310.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f9adeb47afd2eb9ab2478d902d50a4f704aaf9f93334875d73c164e95f163fc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02320.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02320.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bcf2009c1b61654d7ff96424b3ee6be4a41b988f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02320.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6208fa8be78caa4fad2011a3a563b85e022351196cb64f46252b63f501a64a1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02330.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02330.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be9c9396924d99c19077515ef16b57f3e92d7c95 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02330.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e6e2ed3440384c28f988dc6d69e4a2f4e78a95f7dc53499313f84bd36d490ba +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02340.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02340.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..41652b4f18925b2a960a25a37942560f95be9048 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02340.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc7f03033f5d9a1b614dd3964c0b84075041a18233c7c8ea030f098172133e24 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02350.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02350.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..741219d16686b0412fb59939758a1764ec82253e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02350.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08d5b814f617a80734fe9440400f2a39c1edcf71d0f68fa51eb64d5555083ea9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02360.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02360.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..037d3a07a0fec4a25c3b528a9402424f4e8df938 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02360.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dd0ddda17f42c681faa679362a3a49b7c3674b0f901cda197077956fe690971 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02370.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02370.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8385b5214401fec565ed6e57ddb70a32bbbac34 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02370.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be3736b83047a5cb3ce9c9181046e8d61a5f331b3d37cc7ea5a96c068a06e5c4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02380.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02380.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5db80b9523e35f178535986b503a1f1614c5a4d2 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02380.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e37d21d481c700daa2b3d907b3c3546902960457abf944b2e8bdbf1c39cbbabe +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02390.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02390.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..858b87dcfda2ae6fd3491bf6f20eb11a7e9143c4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02390.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d0a1694e8f8093b1f6cd7513982af504946b62664b1391ca34af5858ca3169 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02400.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02400.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c22b048867118636dc3a12645994839ca02e24d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02400.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167cbada474928593a1d91fe86a3e38e837ffa343b2bf8cea54cfd24e511d27f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02410.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02410.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be85d7fd6c75a2f2b2ee075d337d82aee29529b6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02410.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76d4dc79ae4b9924a84abff4c81049f05b333fba35a6123c8194c98dbb1e0e1a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02420.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02420.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2bb4bc5a094b0953dffe9c04613c55831b3391cc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02420.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ace30f1d095ce180239742e11d497ecf118a342b0040e197308ca6f83262cb3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02430.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02430.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc0e0873efe8a533570eb0200a793c895b9a2172 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02430.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6f550df9c16014a829dd75cf7c0be9fecb6321b08293a8ccace52f84ff8e4c5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02440.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02440.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d18548389c6dc13602ff0d1377017c02ecc50ce0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02440.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d011c8e2a42153f021997e1e5e96433d6bdb2169c8e42ea982142e819ee9c911 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02450.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02450.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b06f86e91480ac890d8d899928a69f08a152010b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02450.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292e16d1b3cea4e432943606e77e96e8385efaf3c6a89eaa40e2eb8621a36d30 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02460.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02460.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..251b4d2543d66f151812553395d890ccb97fb5ac --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02460.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db277db72337186ae2196ceeabbb5d157425357b0e4bc3115937eac31475c93d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02470.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02470.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..07932c308aa672a8da07c4c5f7e2c801348fb919 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02470.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dccfdcdafe8f75a6cece0b4b65c1af656ce6e8d7fc86880a9177bbfa1ba08ef +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02480.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02480.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..92337739ab4affa39575427b1658718870f463a8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02480.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74cb9724c833ef355a328acaa18dbca4eb5f17189f3b300fa45fae19b8c87696 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02490.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02490.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fc575bda781124a3d898c6f57f519d55579e5d0a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02490.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1b36d61a01b9b740e759cbff973fd6b8ae01d9ee37904bae1e0db3484501dae +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02500.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02500.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6639e23787cd33223e110a3efbc41a177e869180 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02500.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce13761ff2701ea294332fb6ecb241bf51a0805f008ae515e840cb85bc5c727 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02510.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02510.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be5f1d55ad8c4a964955ea9f640421cc62e3e4c6 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02510.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dbd78b1c91178547c690b0214d1fbe69c29a00ec30a81de2ab588ae81701daa +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02520.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02520.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37f41e855b7ee24fc9741cf4fc578745884f298c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02520.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43f5a5e7241f330fbfe11d9e724ff8c035ddd457e542eecb081b1fcc4e92154d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02530.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02530.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..57d7816dc71fc2d99eff11237bb74dcd510f27db --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02530.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17e522f5c9daa059dba40dee9576076659e5eb1cfd2e49598e2506a151520256 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02540.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02540.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d0dfc78330666aff9036d8cef11e08a03fa0a23 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02540.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41523bea3588aca9bc19daae875caf11f46c5ecf869a70c5c7bff36cbba8995f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02550.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02550.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6816b89a22b2a68f71a722bd13e8191352153dcd --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02550.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a67ac68bf6ed0838f03317010e12a3529ce7bb13272361d84508f786d109a454 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02560.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02560.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f643813350461e390d90586b652ce8783f9add3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02560.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f8f03d8affafd39c1494307d8b06eb8279f96aabac76da830f5fba6ff287804 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02570.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02570.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2f474d3e4c445512bb0ca60c19b538b7c3d898f9 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02570.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:def79049d222c8bed42fc098a0b63164d66eaba028edeab89b59a3fe1928a652 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02580.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02580.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..48632e32571e1cfb0f5e35c80164e5272717589d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02580.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6367ea56342cec36be7abc58eeac420be937c70f3eefb2df4e2c2e06616370ed +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02590.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02590.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3354e74119de73b0ff11d6fc61c3a763801951fe --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02590.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b3bfe96caca7577883658923b98d09162182cc31a56d75151abfa8ed37c4da +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02600.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02600.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..814402911b3e39880f88743fb965ee79dd983227 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02600.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55cc1f3cb96e117cab2e4fb85a2913bcd2e539d6f690e85bc6c78ddd83328944 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02610.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02610.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f9ae2180bb32c82f7eb79bb1bf846fb93db7733f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02610.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57d1aef65fd9284744d90cb396b471d6b21802a4f0d650c68fd82a6e30ecc153 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02620.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02620.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..118daad61d9a9a8b22ba5ae5a7d6b19bcdf87030 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02620.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd686916519db9d14265c065a8b5bbe73146362825b50933bfd4633a7cc232b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02630.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02630.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8ee394b960703dc15a4bc3b842b59bba964967a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02630.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b728f0d3b3087243bfbbc345de217d8def3eb054930a5804a439199be65734a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02640.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02640.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..22e2bf7cc541b898f5c9f3b90bbefc15158f270c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02640.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec6aa849b3ad3828f96236bcb5d48c5e279a56534c1e16f2af752852dd944fca +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02650.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02650.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..142dc66d65c6facf8cf24aa3771db61cc9850d14 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02650.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9caad9ae6468f7a2678e7fc626880a9bbd618871433d090a0ead6c1040545df8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02660.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02660.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8e9d75110876bde3152f01a388031373a1efb131 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02660.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a19e604f7bdee115ab0b850a1b9e35889ff83c72faa93de8fd84d329aa41c6d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02670.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02670.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..66c234529b52aaf6ea4d2bce5c3bd6e47361b74b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02670.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a77f28f6cfd5650a376575066affa9b9e1cce3d55a98fe3b9664823a0e33b575 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02680.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02680.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d03d0be9b39d75a0067afde28edc2f6b55682e7b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02680.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35cff9aa74d0388dbf00a6e5e30ff856dc44640b1934cd47554e8ac519d749cf +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02690.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02690.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..59ddb9f423f9644c46af3e85bee667e8ec0c08d3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02690.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e011f48875960d4448787997d3f9a320367a4aaadec33ff2cee6609214572e6d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02700.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02700.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..68fecd6ea467f9f19c6ac745fde994f9b1fa2d8a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02700.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e0c68244e8f928dee0a782fb32375f5ecfe4cf1e708b56681adbb01d7fe740 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02710.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02710.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0653a8abc673e39fd79600c7cf4b919bf515464c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02710.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:985c24062333cb85055e359d0b367940af589c4678851264b37ba545a72b9191 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02720.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02720.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..437416d9506634861537e1241ba852c97121921b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02720.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:459a3c4949021c734ef2f8e984651aa9fe3a22bab7b2565fba0f3f2dda66c74a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02730.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02730.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..67d67c62833f6f213d56bad1c5d8073ed9e8f824 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02730.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be634fab25e7a3e5166f41d3c907142f902726cacc7078b415b1f91d9202b2b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02740.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02740.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3dff6f1eab8c9223aaaf6027d406804790aa959b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02740.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8992d928ee6e71172ea307f81d8b071dadbb3fd8996d577743ba050b9fa50c7c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02750.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02750.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..22192ef7780402ad640d02ecdeb76c86ebf638ed --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02750.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d2dfea687ea25816a57b0a1c22e614cc5ef72910eb0d2d34037a45d0bf5057 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02760.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02760.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4b957a1077eb95385c69476f79a6ada0b4b39d8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02760.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d784bb257a2208b5737a16b6b2f79a0078bdba29d195f643066367942fd748b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02770.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02770.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..89e344411398a50f1eab980c6c9b669ca14f0b03 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02770.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9eea2fa0bb688b6bbeb465570e5dc4a7d8218272e71d7580ed67d8329077d69 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02780.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02780.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3d3fb9c9214301ab018f4e841a9fa0ef40fb9d67 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02780.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:047ead622bb59a724bf5f3e574227eaf7ff8a2a9d3e612b0483f21539d78deee +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02790.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02790.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dac2360150eec9ee61968bae32645f8e4efc23d7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02790.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac930f28b1ac92dc50f05859a64e0f27097f79bd93acbc528057be49444a37f1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02800.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02800.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ec95d631e0e4f97899f8618e8f81ada204251c8d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02800.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3de10bc4c33190416a3947911f53af668ac7d0462e7fbc065f07a45066dcbb55 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02810.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02810.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5ce20e0d33e4de6526628c1f273f2cde0626d2ae --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02810.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12f9ad57748b4b45a0d5cb706d9d37601afeaf92e4a5d0318b439098bf6dbfac +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02820.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02820.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..90c901fecfb291cf57d28d96bd4037e211637731 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02820.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e544ff43ac5c86eae4b0394e1c4e16d05a15c4e2db96af029d84f69ae81cff9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02830.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02830.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8202f211f6f82ef1c714690d7a7902e35731010 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02830.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a304be459e9e4977d3c6250f05b2951b3ed277df82dfaf712009caedbf46e5c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02840.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02840.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..667a08109cc65b05cf36730d551ac44331ab8a0d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02840.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c3a76cfabe1834832e9ba934d274ee9795096f86be96525c5d90ec280388456 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02850.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02850.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..42d77a55ef78d19a9cab4fff47f6d5311f2658bc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02850.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f131fbc79cc8d3b55dc5491bc1197fb3dcb45cc5f035b69ef76570b61d073723 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02860.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02860.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be775fa464d2948c97c98c21a820b6ba40d8ea1b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02860.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29e178a0cd3ea3e8db374a29d61bf134c5d8160b6d9f43f9bc8c7c5b815092ec +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02870.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02870.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6cda55706543f29d86d53a79f932a5687522d9a8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02870.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d33ed8226be2ab767ed5dc72e7f934a8f33fb8c57040d1a877b32cf6b8ae2225 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02880.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02880.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..86583e1fbaedb4e45de9447fac44001f94280a8e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02880.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fccc42657488a45095d048571ad8234370b30d88fe7bf7d7b54a829e557c0cb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02890.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02890.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b6a8784fdf3940314ce72b636f9a3a2e54e5b279 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02890.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f6701e2f6c1f9ae2e723eb7d1bd7ac0522691bf233f828626b9484ac31feaa +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02900.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02900.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0c55bd729c29fa0e5ae9bc7b2d2964eca3a65c02 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02900.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ced4b08bdef802ba00006bdcebb5a62aaca6a26fa761b8f2f80961438de40b9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02910.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02910.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b544f3f047a7ab467229e39fa496233137da01da --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02910.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33df27aea64ea731fc0638a643406839629a86c5ec55965502e65ed72654f215 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02920.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02920.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..24f853bd049ebdcc42d3366aa16c63afe16e3ac4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02920.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa419a807e5253d341efd71d36a8b890bebaa12e29d7cb335ed8615ae4e640a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02930.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02930.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..223041a60a5cd66779954aabd22d67b7f9211d14 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02930.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cad7a9e64e691a89a31b83d096ddd85f422a252caeb1f237a863fd4d15a39ab6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02940.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02940.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d34762c7d2eb515daafb4e32cbe0d361b1fb5bd3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02940.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fc76703d47b77fb271f56649a10d2b9c20a7c784a0c727683d137c2aa7ecb5b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02950.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02950.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b1862be25571da23c43da5a01d10f261d7fc3729 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02950.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e69152270ab161c6989dd0f92b4faf7bef458fc3f2469fd8ec243d2c407640bc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02960.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02960.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4503326d56f952f15bf949b96c164fcec22f45b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02960.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f558ae4ba813f31cbace10d630bbbb61eac4cfada8ce37a956d34f9591e22954 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02970.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02970.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..abf0aa3891aef3961ef0dd4ecf7895cf743bf391 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02970.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eebd4b7c20bf4e49ea5cb42f31994ba331a93612947792cb0ee53bb12731519a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02980.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02980.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..01817c248e7e0a9c6ab847d365ad8d0c014848be --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02980.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a792e2728053a54dbd3e922d4dc71e58fbae9e5853f2ec8ada3121a56343f62 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02990.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02990.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c061be598ced3f91d101ed97cd3e358b5f55319b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_02990.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45b572eb417cbf25f2cf97a97851e5d647125ac1d3ad36af1acb06df22df0684 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03000.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03000.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cd9c12b4cb5814d45863c6a93f57df2c1c6301a0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03000.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8da2f1fa56ce6b83a599368d1986d4e5bb99e7e7e58438ec3f773ca51f949df +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03010.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03010.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..063059b3a96d9b3c67da15b484b5c70a39e80de2 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03010.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16fca5789542748457896941cbdc6708a645b135b5596f257dbbdcf1511f8726 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03020.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03020.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3614a8a1dffa3f7de47fbae1db20e6f95835aefb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03020.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b621c323b2c93a699df56495d054c309ddf874206b9660ef60e6a59c3949bf +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03030.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03030.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d1246c7654d721946abf20a86b6c4f4fcd94c23c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03030.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a48b77006fb2432d82bbc837967180ce811dceed2073f76c13fd67ef46edb7f8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03040.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03040.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6734be20a745b6c9252c7c85303a3cdbc39c7655 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03040.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed23698098897394b2d0bd404b4310ddcc73ea088c3f1ed173f7824112330a7e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03050.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03050.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0213968f1482e1606451d05b10e286ef0a151eb2 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03050.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4cdbdd5e2db398e9b6a80ce3a1be9d1df084ee03b3d4524c92d2ea8aa44719 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03060.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03060.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3005ae9e775449b1dec491ee51c7d0bd31707b5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03060.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ee78d5caed441aab3f8fe1b4908899fa9e80b036768e7afb1caef7b4c35e605 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03070.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03070.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cb3c91f434cbdfc4eac36a3c60deb59f1658e3e2 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03070.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c81d7e5548aea77c283a94037155cb9b32e0604e213492e9f3b01cf54cb961eb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03080.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03080.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e25a3a7be6644d39f8f4a1e4ad26b195055369d5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03080.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:157266984f3ae39dd73442bac8ed434b68e264059d0b489814c60ba2907a33b8 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03090.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03090.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5faef7fc0a398a7be2a12d1495fd184e3ae75592 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03090.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4edc70340cff9264620f6577e89470e5bbd6a68bb39fdc0e10bd075521d0fe22 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03100.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03100.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b8492cd27e3fd37928f3f7c4dcf669203c363b40 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03100.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:530e149085a81918b2f3d5e0bf117fb362e06c382414e848e4a8e8752f7b4fdf +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03110.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03110.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1a80448ecacf7b88566a17f31258f8c11115d4ab --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03110.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d592d0fdf73f5345939c0fbddb88130d9a70b1d23350e897640a4e8efdff0a8d +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03120.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03120.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..70a3b8343e23659ca8c509929b1eead4996ef88d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03120.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f31f35ff4e9dbb921d9a26b419024c7d782045a3fdd52bbc641dfb888c7248a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03130.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03130.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bc8d4608221d3febdcc9f624c306c72285db574b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03130.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:961f76bc3f71a5ec5b3aff46f4f6eea65bcb0134b83a38be702335672b7be81b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03140.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03140.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..018a461dc49db9f30d2e43205ca38b6ccccb8bb5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03140.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a1ee22cc5c72e67ce2b4b649d92fa36cdb243f8bd2e59adf47affbaa2c36deb +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03150.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03150.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..613cc64bf75d2363ab9fb65f24fed8d6a1ee73b3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03150.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c96574965f9dc9c283561dfc2786275ffc5d9443157b2f9d20591071c65757c2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03160.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03160.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..46977e05897b88ee0f3b9e34d303397c931e27be --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03160.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:466d0d339b7a84016242803cd0ed45dcb74ec179adbcf794368ff195bc73c491 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03170.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03170.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a14eb4b868b868781d0bc757d94e2ea984f89ad4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03170.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc6e72e2e46a7ed53f2ed5033528f6ea29051f1eeecc98669b3bcd845f7bbb6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03180.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03180.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69bd818fe9eaadeb1d6f8ccb01ab7e460604c236 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03180.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8e1ba8efb794eaef2a82bcc28096eb876627f066cd1d2f3e9f52394d005e070 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03190.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03190.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..40050db07d10ea076dc7c04342888daa76eca612 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03190.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:250a22990e54bc360a61dd1a1a4d1e56293365a2d3ea39aba572e130e73bd667 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03200.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03200.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d07790300d4859b69c521d897c4ad7f7ded6ddd7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03200.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a383fe08fc55a8d07c1e1361aa92947aed5ec3e6f7608d9b9178085481524c6e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03210.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03210.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..81aee8944af8c57f79cd610e181eb948779bd850 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03210.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3466ec85f9807a4704454ac0499418a60454ff9adca0f685a45f7f329a71430e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03220.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03220.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6f29011ba0fa8653b04800474d45e050766fd1c2 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03220.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb4fb062f10bd94edd7b9089be945231db00b2aee40eb65aaab1493a5b0f92a4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03230.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03230.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..286ce14cf88239a0f83aa07091417af77293f35c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03230.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f284e1719f6d4254a212bce769ae6508075c9065cb3b3a0e81860e40aca211c9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03240.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03240.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..168d0a8573196c98a10d7a4c12bffe265d0a4202 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03240.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ab5608e2b896c64d479488f6e370ed2e6e60eeb0c463bf068b70132512da12 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03250.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03250.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a1c49f048c83c965d835aa51bc96735125f384cc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03250.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47b535898bedc5c4f403b2d656f47910abc33971b1de8bfaab3e1d0a836cbf63 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03260.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03260.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a29f3126acf61fa9893ca57246c902739340865 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03260.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19c7de394b693167d86a6f05d7ce3b92b4f3a785ba2649aca910e10689e14ec2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03270.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03270.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f6a7c7750a4832cd72949ffcdc3e36392817237f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03270.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92c2f8b954103ced3f36addc367d1001751b78cd7f5f9e9a61476269ccafefad +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03280.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03280.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e0ec6534f0c655ff900373b34a03540103500af4 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03280.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec278c6e0c7d1889dc1654b8398a210f0da11cdd2f3858ac9a2cd6af5b15d24 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03290.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03290.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1ff4c4cdd09a493940460725a83954c4da915818 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03290.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:429c133f46a755e72890d95960765990302c77ccc1418a5a807d2134f6de76a9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03300.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03300.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c1d7dd38e7dc0215cca16bb2bd11bc2776344f8b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03300.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1abb2f8a7685fcfdd6473b40d8bc06210482e5e1bacd0f5a0b61e48a6ca7d6b0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03310.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03310.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e8135a66587fba9c40c20fccc5fe88cef5984e3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03310.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:356ef18ca8a4a924b68242d4b72bed969c3d9ce46707fa8ec09c277f544bab69 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03320.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03320.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f2c5c77d20d9fc2f1daa5460d6ed738e658869a1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03320.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16586aebdcc8d74a2c4fb4faa19ee317b78dccd0c70ba1d38e5f277ed3c48121 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03330.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03330.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6b1fa2f39caef514f69da433e64d42a1cd1316e1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03330.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fa0980a5a05f58170c10b9428f11af7f9485a6c0c5ab42bf9b335f303a78f7b +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03340.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03340.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..11f3d4e387d73623f33a13452705298cc4616ac8 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03340.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9981fd5df40fdbc994c0f94aaa75fddd2d33078de544f55480c246708275ba18 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03350.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03350.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3e899900db72a05febc8090a05807a2ad6435beb --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03350.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ededfe972c2082efb31e4c1c35d7be9190fb7b525155997f10105686618332cd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03360.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03360.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7e52f70112e843b2eee145e3f63281df573dc57c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03360.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:877abbbc45d8e588c65168042ba4b56a079aec1a9026261b005615cadd12cc91 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03370.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03370.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..834f8b79c3cb044c58593f3b1ae1f5206070b8fc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03370.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd3ba585534f31ef9cb4fd89a4ddae20630c87b36958d6adfe7dcfda2af27a7 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03380.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03380.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..91cacc6b3d4cbc8e6934adcecbeeb47be97dcc8a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03380.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30d88207a50ff0273676a9751ed1a0444eeaab06961649d8743b89b7194d3fe6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03390.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03390.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..45998c4e2afa60341742e89df08043a57f595314 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03390.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54dc929194cb49b0a72c7548ff4bc9951fcc5ceff61a6d9918c4724b999d6130 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03400.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03400.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d06286d40b00e24615f28bf53538dde04ea0698 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03400.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b917f0a76ea49cc4a68fc406dfc157b04c04a8fd79adcf338804f1ea232544fe +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03410.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03410.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e409ff58b56d1d0dd3bd82b8ac0b1de76dc5488 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03410.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff44414f75cc719b1eee2a2b8af9bc8fd6b29e105c9c40da701ce79c9402334a +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03420.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03420.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a8ec635b5f87ee39312eae140ba6b699c24ec667 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03420.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa9189793255942cfd4028801d82b3ddcbf962007917d28851d92fda8920894 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03430.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03430.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e88f9215abbd7945bd2442dd2b3662581692243d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03430.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:698e14a212439706e27217ad6818cebe0392d486710d864205f97a928af7a760 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03440.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03440.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8344153425d83740431abe82a20a4bc4a573660 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03440.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26dc53b561ddfa74ffa5598d5251494106f61527a65ee7979cde97d5804f4dc0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03450.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03450.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..364f7f8b646d5cdd48ec3a9364fa46adf640bdb1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03450.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c887158c3a9d8c068eb0480dd3861ce5108b1fad68afded9204005efd7265fe5 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03460.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03460.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09b518b985ccb06d99eeb8f11b3a59bfb2a5f501 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03460.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ee2eb00bf56bbe50c493795ffe79c2644a5a1fdee34ac1de69e3fb11ec289cc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03470.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03470.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8c5ec595ad287e56044ae986e690f31e4f270623 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03470.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce0fb4b0c3d90923e15b86c8541501c1bb26ea75d1175044dae7011d39b127f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03480.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03480.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e3c4e854e8734f6ef73847f0f501e43afa867bac --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03480.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ae306082ba74326c5e6a36574a233539802de048a6cb95d0f739bfa4d61d47 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03490.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03490.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7292795b997793505171961d38428c901f8bc904 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03490.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddf8664e85b1208f7786f9870ee1277c69fe4f555dc7a4fa37a4ff8554564065 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03500.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03500.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c52669f7dcf0a178d9f0b1676c4b837534628ff5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03500.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad2fbe7308f810ac8faa2a7dd2d4b6fff82f60e4c34b350a9b9b87dc9e1dbdf3 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03510.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03510.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..852b6d43c6b3551ef545552c58f96371d939c66b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03510.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1472fbe16b83de24586df2d2cf29358caf3ae70e6e34ff9f9b22f0f35e9cc751 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03520.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03520.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..10080687b4cbde21cc117f98a295bdc9d901cbfe --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03520.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8728c6bb3713f19a5b02f9e7e99e57300212993bf6048c105861eb4ecacd6659 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03530.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03530.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..467386951375bd415cac6580b3705005bcc66d7e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03530.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a14324586aec5c68f8cadc6a2f6d279106f64bd3d3d1a02087b5ec3718834fa4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03540.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03540.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6cc97a5e2b0d667d00c64ad3ff4699d5474b39af --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03540.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978c2e8ae8873072c3946ad26e289dcdc430df13e5fa4bb6deb2c63ba983b9ae +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03550.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03550.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7d17155316ca9d5073e1a73021e634d7c85fd186 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03550.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7db071ad9a2ecd2c6708b89220341339da7c1d457502b2642f9af37b8aaf86d9 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03560.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03560.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a9bd483bf5c208dfe4650a6d19ea9e46c649744 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03560.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e925246b5c40a1331f74508e7432406ca03ff7d0edc3937fc16b6f9c56e7d6 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03570.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03570.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c884f0dcb1eb67275b60143dedc19947177d5a32 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03570.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:623c91946e48f25a3fc0442c630de56c695669af913d8156afaf281cddccd51e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03580.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03580.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc4db540b5f7dee5598d73fbc494296fb18e9591 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03580.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0460958184fb04f0512e5b1a7be1c02d7d1634fb48f1385b584d5bb6dc4b697e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03590.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03590.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..31c4a08a55e8d6fd73a78b570ce0c09f87a0765b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03590.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d2eb036faee6abb112e9917ef3c95a19e1c05defdfe40afcdb853d1b0e67790 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03600.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03600.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03f911638c4ffc317c6516b24542a0c04a444fce --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03600.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c91459132b9f406e1b95cae1a7dcddcba43be33d34755a667a517667592113e +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03610.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03610.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..337f6f4f810833dfee052d980726371cf405338f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03610.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0b1e6109b349eb4d4e157ad16b3898b512f85a3866d0f599e918e1268c12129 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03620.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03620.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c6107d96d1e3984182c2df9cc20377f44934002c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03620.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da49ed55384732d65245ea363958b4c094e0ac4243540b8fb3ab5fb0435a8926 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03630.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03630.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a58a62b55d07c1f54bdf4d6661e01ed64d912c9d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03630.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fc8a5f012838aed4c09e2cfae7e4aaf7dd8a9aec200108a13558748a328a8a2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03640.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03640.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0158705b6a6b276fbec4580c2c4b0f39e5d39106 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03640.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdff69aeaa5a0de3e245fee5667cfa0259723b3d592e07aa8ba4b77552c676d2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03650.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03650.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ddbffb4f983b430ef43e024740a3cc7df36bcfc --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03650.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:add49947689419da069b16d6a865bd0cdc38c1ccbf5ecc587ee33c73b245290f +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03660.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03660.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c1ab09534a50bfec5c390286b2dd31487ca2032a --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03660.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d05b1c4b2051fadf58f437d8bad8793b47467a805bedba304aaca9c0301f4247 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03670.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03670.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..34e0d130f29cc6566e6b6207a278ebd49382abd3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03670.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c358bda23d4ce8f26201b1c0251b6bcecbfa02f6f8c53e6c94fd00c7d5c1654 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03680.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03680.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..446fda3f992b7f70a02672a89c1c7cc238959cfa --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03680.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28b2c8ede672ca441189f8591cc329f5f0b424bf8e31226c856c1cfbf2fbd0d1 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03690.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03690.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09ba80b235201f2572cb6f8472dd5d7ea6bccee5 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03690.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:384ab249bd07ca3016ee79396f6adaa9314391f978b4b809477de00195199239 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03700.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03700.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..258969bf9cd09a45e4d31b0e6ab976dbb7cf61b7 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03700.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3acc71588829309a3e82175f3185ce27a49dc5c39e71ee7733ebc4707a8a2cd +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03710.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03710.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c509441d2d3b0cb618427a56cc61c08653521768 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03710.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ef48a5ddd479e340f0d56da0c4bd5cf29b9474d8f49afcbdfc39f1ae6a107f0 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03720.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03720.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5c124510e22fdc1ee8438733b8ec2fc4669bc4e --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03720.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b930d26e949038468efbcd70df0f980bbe1fc45352bf3113f312f590172e68fc +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03730.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03730.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e061b7927bab98e7c659e1267190c16143cb2b1 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03730.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a8596ed1455e0642facb210b1ad09a7294fa4a931bcd48fa4af20aa0fffe2c4 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03740.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03740.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..991679c13033e9d3edfbf78cea3ae4d94097b9a0 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03740.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3058a672c8b82491b95637041258e6055119d482f472282891d2c6cd61400db2 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03750.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03750.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c642a80382593c6adff5d8503b1e3d8cf5eb90c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03750.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15401fb48d0771f60c89ef16df0ce0b089c37a6bb37e1a1e02ba7bfeff44b1c +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03760.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03760.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b67fa39490b1a2a19af0de2260c329ef8ec507ca --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03760.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08262a226d403ce74349d13d0d747cee8a09c7087a4b23cad0e02b406807874 +size 795208 diff --git a/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03770.safetensors b/al_0.6_g_0.97_id_11_seed_970611/checkpoints/ckpt_03770.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/al_0.6_g_0.97_id_11_seed_970611/config.cfg b/al_0.6_g_0.97_id_11_seed_970611/config.cfg new file mode 100644 index 0000000000000000000000000000000000000000..a349aa4b9d2451deded1d4ca5c651ff6b2461f7f --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/config.cfg @@ -0,0 +1,69 @@ +rl_action=train +num_rollout_steps=64 +lr=5e-05 +discount_rate=0.97 +eff_horizon=None +eval_every=1 +use_wandb=True +use_hf=True +use_log=True +num_total_env_steps=10000000000 +checkpoint=al_0.6_g_0.97_id_11_seed_970611 +render_sixel=False +sixel_idx=60 +seed=970611 +run_id=11 +seed_formula={int(discount_rate*100):02d}{int(alpha*10):02d}{run_id:02d} +mask_type=first_episode +penalize_time=False +optim=adam +live_monitor=False +use_bf16=False +deterministic=True +eval_schedule=0:1,250:2,500:5,2000:10 +grad_acc_per_chunk=5 +num_rollout_chunks=1 +cheese_loc=any +env_rule=None +env_layout=open +alpha=0.6 +env_size=13 +num_levels=9600 +f_str_ckpt=al_{alpha}_g_{discount_rate}_id_{run_id}_seed_{seed} +wandb_project=jaxgmg2_3phase_unique +ckpt_dir=jaxgmg2_3phase_unique +duplication_factor=-1 +smoke=False +compile=True +num_chains=6 +num_draws=3000 +num_steps_bw_draws=1 +on_policy=True +llc_nbeta=3000 +localization=10 +exact_solver_each_draw=False +llc_optimizer=sgld +iw_clip_eps=None +rmsprop_burnin_steps=20 +llc_data_file=llc_scan_open_reinforce.pkl +llc_checkpoint_index=None +llc_checkpoint_number=None +sink=None +repo_id=davidquarel/jaxgmg_ckpt_zip +use_shuffled_checkpoints=False +force_re_download=False +off_distribution_data=False +weight_restrictions=None +weight_restrictions_invert=False +evaluate_every_position=False +num_prev_actions=1 +ntfy=david_jaxgmg +vis_average_state=False +trim_episodes=True +use_prev_action=False +ckpt_path=jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611 +env_steps_per_loop=614400 +total_loops=16276 +eff_acc_steps=5 +env_steps_per_microbatch=122880 +chunk_size=9600 diff --git a/al_0.6_g_0.97_id_11_seed_970611/config.json b/al_0.6_g_0.97_id_11_seed_970611/config.json new file mode 100644 index 0000000000000000000000000000000000000000..425cfca6a5233eaf3edd31892fb9f20f8a8457e3 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/config.json @@ -0,0 +1,71 @@ +{ + "alpha": 0.6, + "checkpoint": "al_0.6_g_0.97_id_11_seed_970611", + "cheese_loc": "any", + "chunk_size": 9600, + "ckpt_dir": "jaxgmg2_3phase_unique", + "ckpt_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611", + "compile": true, + "deterministic": true, + "discount_rate": 0.97, + "duplication_factor": -1, + "eff_acc_steps": 5, + "eff_horizon": null, + "env_layout": "open", + "env_rule": null, + "env_size": 13, + "env_steps_per_loop": 614400, + "env_steps_per_microbatch": 122880, + "eval_every": 1, + "eval_schedule": "0:1,250:2,500:5,2000:10", + "evaluate_every_position": false, + "exact_solver_each_draw": false, + "f_str_ckpt": "al_{alpha}_g_{discount_rate}_id_{run_id}_seed_{seed}", + "force_re_download": false, + "grad_acc_per_chunk": 5, + "iw_clip_eps": null, + "live_monitor": false, + "llc_checkpoint_index": null, + "llc_checkpoint_number": null, + "llc_data_file": "llc_scan_open_reinforce.pkl", + "llc_nbeta": 3000, + "llc_optimizer": "sgld", + "localization": 10, + "lr": 5e-05, + "mask_type": "first_episode", + "ntfy": "david_jaxgmg", + "num_chains": 6, + "num_draws": 3000, + "num_levels": 9600, + "num_prev_actions": 1, + "num_rollout_chunks": 1, + "num_rollout_steps": 64, + "num_steps_bw_draws": 1, + "num_total_env_steps": 10000000000, + "off_distribution_data": false, + "on_policy": true, + "optim": "adam", + "penalize_time": false, + "render_sixel": false, + "repo_id": "davidquarel/jaxgmg_ckpt_zip", + "rl_action": "train", + "rmsprop_burnin_steps": 20, + "run_id": 11, + "seed": 970611, + "seed_formula": "{int(discount_rate*100):02d}{int(alpha*10):02d}{run_id:02d}", + "sink": null, + "sixel_idx": 60, + "smoke": false, + "total_loops": 16276, + "trim_episodes": true, + "use_bf16": false, + "use_hf": true, + "use_log": true, + "use_prev_action": false, + "use_shuffled_checkpoints": false, + "use_wandb": true, + "vis_average_state": false, + "wandb_project": "jaxgmg2_3phase_unique", + "weight_restrictions": null, + "weight_restrictions_invert": false +} \ No newline at end of file diff --git a/al_0.6_g_0.97_id_11_seed_970611/eval.jsonl b/al_0.6_g_0.97_id_11_seed_970611/eval.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..158258519fd0d2e29d248084650a19a292f11b7b --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/eval.jsonl @@ -0,0 +1,852 @@ +{"ts": "2026-01-29T21:25:57.740706Z", "loop": 0, "env_steps": 0, "exact_value_avg": 0.09582492709159851, "regret_dist": 0.7079524993896484, "regret_other_env": 0.7102985978126526, "regret_corner": 0.7044332027435303, "regret_row": 0.7088123559951782, "regret_any": 0.7102985978126526, "regret_bot": 0.7088576555252075, "value_dist": 0.09582492709159851, "value_other_env": 0.11925449222326279, "value_corner": 0.060680560767650604, "value_row": 0.08787668496370316, "value_any": 0.11925449222326279, "value_bot": 0.08783135563135147, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00000.png", "entropy": 1.3862764835357666} +{"ts": "2026-01-29T21:25:59.016902Z", "loop": 1, "env_steps": 614400, "exact_value_avg": 0.09614585340023041, "regret_dist": 0.707631528377533, "regret_other_env": 0.7102882862091064, "regret_corner": 0.7036463022232056, "regret_row": 0.7082434892654419, "regret_any": 0.7102882862091064, "regret_bot": 0.7094120383262634, "value_dist": 0.09614585340023041, "value_other_env": 0.11926480382680893, "value_corner": 0.06146742030978203, "value_row": 0.08844558894634247, "value_any": 0.11926480382680893, "value_bot": 0.08727709203958511, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00001.png", "entropy": 1.3862820863723755} +{"ts": "2026-01-29T21:26:00.230766Z", "loop": 2, "env_steps": 1228800, "exact_value_avg": 0.09645573794841766, "regret_dist": 0.7073216438293457, "regret_other_env": 0.7102785706520081, "regret_corner": 0.7028861045837402, "regret_row": 0.7077164053916931, "regret_any": 0.7102785706520081, "regret_bot": 0.7099159955978394, "value_dist": 0.09645573794841766, "value_other_env": 0.11927451938390732, "value_corner": 0.06222756206989288, "value_row": 0.08897266536951065, "value_any": 0.11927451938390732, "value_bot": 0.08677305281162262, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00002.png", "entropy": 1.3862847089767456} +{"ts": "2026-01-29T21:26:01.436844Z", "loop": 3, "env_steps": 1843200, "exact_value_avg": 0.09675722569227219, "regret_dist": 0.7070201635360718, "regret_other_env": 0.7102702260017395, "regret_corner": 0.7021449208259583, "regret_row": 0.7072080373764038, "regret_any": 0.7102702260017395, "regret_bot": 0.7103970050811768, "value_dist": 0.09675722569227219, "value_other_env": 0.11928284168243408, "value_corner": 0.06296878308057785, "value_row": 0.08948096632957458, "value_any": 0.11928284168243408, "value_bot": 0.0862920880317688, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00003.png", "entropy": 1.386284589767456} +{"ts": "2026-01-29T21:26:02.642410Z", "loop": 4, "env_steps": 2457600, "exact_value_avg": 0.09706153720617294, "regret_dist": 0.7067158222198486, "regret_other_env": 0.7102624773979187, "regret_corner": 0.7013956904411316, "regret_row": 0.7066870927810669, "regret_any": 0.7102624773979187, "regret_bot": 0.7108861207962036, "value_dist": 0.09706153720617294, "value_other_env": 0.11929057538509369, "value_corner": 0.06371797621250153, "value_row": 0.09000198543071747, "value_any": 0.11929057538509369, "value_bot": 0.08580297976732254, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00004.png", "entropy": 1.3862813711166382} +{"ts": "2026-01-29T21:26:03.846492Z", "loop": 5, "env_steps": 3072000, "exact_value_avg": 0.09736642241477966, "regret_dist": 0.7064108848571777, "regret_other_env": 0.7102541923522949, "regret_corner": 0.7006459832191467, "regret_row": 0.7061796188354492, "regret_any": 0.7102541923522949, "regret_bot": 0.7113545536994934, "value_dist": 0.09736642241477966, "value_other_env": 0.11929886043071747, "value_corner": 0.06446775794029236, "value_row": 0.09050944447517395, "value_any": 0.11929886043071747, "value_bot": 0.08533455431461334, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00005.png", "entropy": 1.3862757682800293} +{"ts": "2026-01-29T21:26:05.052930Z", "loop": 6, "env_steps": 3686400, "exact_value_avg": 0.09766560792922974, "regret_dist": 0.7061117887496948, "regret_other_env": 0.7102472186088562, "regret_corner": 0.6999086141586304, "regret_row": 0.7056698799133301, "regret_any": 0.7102472186088562, "regret_bot": 0.7118216753005981, "value_dist": 0.09766560792922974, "value_other_env": 0.11930589377880096, "value_corner": 0.0652051717042923, "value_row": 0.09101913124322891, "value_any": 0.11930589377880096, "value_bot": 0.08486735075712204, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00006.png", "entropy": 1.3862675428390503} +{"ts": "2026-01-29T21:26:06.271669Z", "loop": 7, "env_steps": 4300800, "exact_value_avg": 0.09795575588941574, "regret_dist": 0.7058216333389282, "regret_other_env": 0.7102437615394592, "regret_corner": 0.6991882920265198, "regret_row": 0.7051845788955688, "regret_any": 0.7102437615394592, "regret_bot": 0.7122724652290344, "value_dist": 0.09795575588941574, "value_other_env": 0.11930930614471436, "value_corner": 0.06592541188001633, "value_row": 0.09150448441505432, "value_any": 0.11930930614471436, "value_bot": 0.08441665023565292, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00007.png", "entropy": 1.3862571716308594} +{"ts": "2026-01-29T21:26:07.484643Z", "loop": 8, "env_steps": 4915200, "exact_value_avg": 0.09824348241090775, "regret_dist": 0.7055338621139526, "regret_other_env": 0.710242748260498, "regret_corner": 0.6984705328941345, "regret_row": 0.7047062516212463, "regret_any": 0.710242748260498, "regret_bot": 0.7127267122268677, "value_dist": 0.09824348241090775, "value_other_env": 0.11931031942367554, "value_corner": 0.06664322316646576, "value_row": 0.09198280423879623, "value_any": 0.11931031942367554, "value_bot": 0.08396238833665848, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00008.png", "entropy": 1.386244297027588} +{"ts": "2026-01-29T21:26:08.691765Z", "loop": 9, "env_steps": 5529600, "exact_value_avg": 0.09853767603635788, "regret_dist": 0.7052397131919861, "regret_other_env": 0.7102425694465637, "regret_corner": 0.6977353692054749, "regret_row": 0.7042359113693237, "regret_any": 0.7102425694465637, "regret_bot": 0.7131757736206055, "value_dist": 0.09853767603635788, "value_other_env": 0.11931052058935165, "value_corner": 0.06737839430570602, "value_row": 0.09245312213897705, "value_any": 0.11931052058935165, "value_bot": 0.08351331204175949, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00009.png", "entropy": 1.3862290382385254} +{"ts": "2026-01-29T21:26:09.896591Z", "loop": 10, "env_steps": 6144000, "exact_value_avg": 0.09883897751569748, "regret_dist": 0.7049384117126465, "regret_other_env": 0.7102426290512085, "regret_corner": 0.6969819664955139, "regret_row": 0.703749418258667, "regret_any": 0.7102426290512085, "regret_bot": 0.7136371731758118, "value_dist": 0.09883897751569748, "value_other_env": 0.11931046098470688, "value_corner": 0.06813173741102219, "value_row": 0.09293965250253677, "value_any": 0.11931046098470688, "value_bot": 0.08305192738771439, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00010.png", "entropy": 1.3862109184265137} +{"ts": "2026-01-29T21:26:11.099014Z", "loop": 11, "env_steps": 6758400, "exact_value_avg": 0.099153071641922, "regret_dist": 0.704624354839325, "regret_other_env": 0.7102439999580383, "regret_corner": 0.6961948275566101, "regret_row": 0.7032451629638672, "regret_any": 0.7102439999580383, "regret_bot": 0.7141120433807373, "value_dist": 0.099153071641922, "value_other_env": 0.11930917203426361, "value_corner": 0.06891891360282898, "value_row": 0.0934438705444336, "value_any": 0.11930917203426361, "value_bot": 0.08257696777582169, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00011.png", "entropy": 1.3861898183822632} +{"ts": "2026-01-29T21:26:12.303683Z", "loop": 12, "env_steps": 7372800, "exact_value_avg": 0.09948039054870605, "regret_dist": 0.7042970061302185, "regret_other_env": 0.7102464437484741, "regret_corner": 0.6953728199005127, "regret_row": 0.7027264833450317, "regret_any": 0.7102464437484741, "regret_bot": 0.7145959138870239, "value_dist": 0.09948039054870605, "value_other_env": 0.11930665373802185, "value_corner": 0.06974098086357117, "value_row": 0.09396251291036606, "value_any": 0.11930665373802185, "value_bot": 0.08209317922592163, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00012.png", "entropy": 1.3861651420593262} +{"ts": "2026-01-29T21:26:13.514111Z", "loop": 13, "env_steps": 7987200, "exact_value_avg": 0.09982045739889145, "regret_dist": 0.7039568424224854, "regret_other_env": 0.7102500796318054, "regret_corner": 0.6945170164108276, "regret_row": 0.7021943926811218, "regret_any": 0.7102500796318054, "regret_bot": 0.7150854468345642, "value_dist": 0.09982045739889145, "value_other_env": 0.11930298060178757, "value_corner": 0.07059666514396667, "value_row": 0.09449467062950134, "value_any": 0.11930298060178757, "value_bot": 0.08160357922315598, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00013.png", "entropy": 1.3861371278762817} +{"ts": "2026-01-29T21:26:14.724583Z", "loop": 14, "env_steps": 8601600, "exact_value_avg": 0.10017023980617523, "regret_dist": 0.7036070823669434, "regret_other_env": 0.7102552652359009, "regret_corner": 0.6936348080635071, "regret_row": 0.7016602158546448, "regret_any": 0.7102552652359009, "regret_bot": 0.7155731916427612, "value_dist": 0.10017023980617523, "value_other_env": 0.1192978024482727, "value_corner": 0.07147889584302902, "value_row": 0.0950288251042366, "value_any": 0.1192978024482727, "value_bot": 0.08111587166786194, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00014.png", "entropy": 1.3861051797866821} +{"ts": "2026-01-29T21:26:15.929380Z", "loop": 15, "env_steps": 9216000, "exact_value_avg": 0.10053499042987823, "regret_dist": 0.7032424211502075, "regret_other_env": 0.7102628350257874, "regret_corner": 0.6927116513252258, "regret_row": 0.7011091709136963, "regret_any": 0.7102628350257874, "regret_bot": 0.7160727381706238, "value_dist": 0.10053499042987823, "value_other_env": 0.119290292263031, "value_corner": 0.07240202277898788, "value_row": 0.09557989239692688, "value_any": 0.119290292263031, "value_bot": 0.08061633259057999, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00015.png", "entropy": 1.3860688209533691} +{"ts": "2026-01-29T21:26:17.131668Z", "loop": 16, "env_steps": 9830400, "exact_value_avg": 0.10091409832239151, "regret_dist": 0.7028632760047913, "regret_other_env": 0.710272490978241, "regret_corner": 0.6917493343353271, "regret_row": 0.7005309462547302, "regret_any": 0.710272490978241, "regret_bot": 0.7165924906730652, "value_dist": 0.10091409832239151, "value_other_env": 0.11928058415651321, "value_corner": 0.07336436212062836, "value_row": 0.09615810960531235, "value_any": 0.11928058415651321, "value_bot": 0.08009655773639679, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00016.png", "entropy": 1.3860276937484741} +{"ts": "2026-01-29T21:26:18.336201Z", "loop": 17, "env_steps": 10444800, "exact_value_avg": 0.10131064057350159, "regret_dist": 0.7024667263031006, "regret_other_env": 0.7102845907211304, "regret_corner": 0.6907398700714111, "regret_row": 0.6999323964118958, "regret_any": 0.7102845907211304, "regret_bot": 0.7171241044998169, "value_dist": 0.10131064057350159, "value_other_env": 0.11926846951246262, "value_corner": 0.07437389343976974, "value_row": 0.09675662219524384, "value_any": 0.11926846951246262, "value_bot": 0.07956494390964508, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00017.png", "entropy": 1.3859814405441284} +{"ts": "2026-01-29T21:26:19.544394Z", "loop": 18, "env_steps": 11059200, "exact_value_avg": 0.1017226055264473, "regret_dist": 0.7020548582077026, "regret_other_env": 0.7102987766265869, "regret_corner": 0.6896888017654419, "regret_row": 0.6993140578269958, "regret_any": 0.7102987766265869, "regret_bot": 0.7176704406738281, "value_dist": 0.1017226055264473, "value_other_env": 0.11925432831048965, "value_corner": 0.07542501389980316, "value_row": 0.09737499803304672, "value_any": 0.11925432831048965, "value_bot": 0.07901860028505325, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00018.png", "entropy": 1.3859294652938843} +{"ts": "2026-01-29T21:26:20.750471Z", "loop": 19, "env_steps": 11673600, "exact_value_avg": 0.10215094685554504, "regret_dist": 0.7016264200210571, "regret_other_env": 0.7103133797645569, "regret_corner": 0.6885960102081299, "regret_row": 0.6986786723136902, "regret_any": 0.7103133797645569, "regret_bot": 0.7182262539863586, "value_dist": 0.10215094685554504, "value_other_env": 0.11923978477716446, "value_corner": 0.07651767879724503, "value_row": 0.09801039844751358, "value_any": 0.11923978477716446, "value_bot": 0.07846275717020035, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00019.png", "entropy": 1.3858721256256104} +{"ts": "2026-01-29T21:26:21.958664Z", "loop": 20, "env_steps": 12288000, "exact_value_avg": 0.10260061919689178, "regret_dist": 0.7011767625808716, "regret_other_env": 0.7103291749954224, "regret_corner": 0.6874481439590454, "regret_row": 0.6980151534080505, "regret_any": 0.7103291749954224, "regret_bot": 0.7187998294830322, "value_dist": 0.10260061919689178, "value_other_env": 0.1192239299416542, "value_corner": 0.07766564935445786, "value_row": 0.098673976957798, "value_any": 0.1192239299416542, "value_bot": 0.07788918912410736, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00020.png", "entropy": 1.3858081102371216} +{"ts": "2026-01-29T21:26:23.164854Z", "loop": 21, "env_steps": 12902400, "exact_value_avg": 0.10307301580905914, "regret_dist": 0.7007043361663818, "regret_other_env": 0.7103474140167236, "regret_corner": 0.6862396597862244, "regret_row": 0.6973276734352112, "regret_any": 0.7103474140167236, "regret_bot": 0.7193887233734131, "value_dist": 0.10307301580905914, "value_other_env": 0.11920563131570816, "value_corner": 0.07887408882379532, "value_row": 0.09936138242483139, "value_any": 0.11920563131570816, "value_bot": 0.07730033248662949, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00021.png", "entropy": 1.3857365846633911} +{"ts": "2026-01-29T21:26:24.376835Z", "loop": 22, "env_steps": 13516800, "exact_value_avg": 0.10356422513723373, "regret_dist": 0.7002131938934326, "regret_other_env": 0.7103674411773682, "regret_corner": 0.6849817037582397, "regret_row": 0.6966142654418945, "regret_any": 0.7103674411773682, "regret_bot": 0.7199950218200684, "value_dist": 0.10356422513723373, "value_other_env": 0.11918569356203079, "value_corner": 0.08013201504945755, "value_row": 0.10007475316524506, "value_any": 0.11918569356203079, "value_bot": 0.07669401913881302, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00022.png", "entropy": 1.3856571912765503} +{"ts": "2026-01-29T21:26:25.579391Z", "loop": 23, "env_steps": 14131200, "exact_value_avg": 0.1040799617767334, "regret_dist": 0.6996974349021912, "regret_other_env": 0.7103870511054993, "regret_corner": 0.6836629509925842, "regret_row": 0.6958726644515991, "regret_any": 0.7103870511054993, "regret_bot": 0.720613420009613, "value_dist": 0.1040799617767334, "value_other_env": 0.1191660687327385, "value_corner": 0.08145078271627426, "value_row": 0.10081641376018524, "value_any": 0.1191660687327385, "value_bot": 0.07607563585042953, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00023.png", "entropy": 1.3855698108673096} +{"ts": "2026-01-29T21:26:26.782397Z", "loop": 24, "env_steps": 14745600, "exact_value_avg": 0.10462667047977448, "regret_dist": 0.6991506814956665, "regret_other_env": 0.7104064226150513, "regret_corner": 0.6822670698165894, "regret_row": 0.6950931549072266, "regret_any": 0.7104064226150513, "regret_bot": 0.7212496995925903, "value_dist": 0.10462667047977448, "value_other_env": 0.11914670467376709, "value_corner": 0.08284662663936615, "value_row": 0.10159585624933243, "value_any": 0.11914670467376709, "value_bot": 0.07543937116861343, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00024.png", "entropy": 1.3854724168777466} +{"ts": "2026-01-29T21:26:27.985042Z", "loop": 25, "env_steps": 15360000, "exact_value_avg": 0.10519839823246002, "regret_dist": 0.6985790729522705, "regret_other_env": 0.7104317545890808, "regret_corner": 0.6807999014854431, "regret_row": 0.694290280342102, "regret_any": 0.7104317545890808, "regret_bot": 0.7219082117080688, "value_dist": 0.10519839823246002, "value_other_env": 0.11912142485380173, "value_corner": 0.08431385457515717, "value_row": 0.10239879041910172, "value_any": 0.11912142485380173, "value_bot": 0.07478083670139313, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00025.png", "entropy": 1.3853639364242554} +{"ts": "2026-01-29T21:26:29.186680Z", "loop": 26, "env_steps": 15974400, "exact_value_avg": 0.10580776631832123, "regret_dist": 0.6979695558547974, "regret_other_env": 0.7104641795158386, "regret_corner": 0.6792275905609131, "regret_row": 0.6934393644332886, "regret_any": 0.7104641795158386, "regret_bot": 0.7226106524467468, "value_dist": 0.10580776631832123, "value_other_env": 0.11908887326717377, "value_corner": 0.08588609844446182, "value_row": 0.10324973613023758, "value_any": 0.11908887326717377, "value_bot": 0.07407842576503754, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00026.png", "entropy": 1.3852423429489136} +{"ts": "2026-01-29T21:26:30.391508Z", "loop": 27, "env_steps": 16588800, "exact_value_avg": 0.10646617412567139, "regret_dist": 0.697311282157898, "regret_other_env": 0.7105018496513367, "regret_corner": 0.6775252819061279, "regret_row": 0.692543625831604, "regret_any": 0.7105018496513367, "regret_bot": 0.7233472466468811, "value_dist": 0.10646617412567139, "value_other_env": 0.11905130743980408, "value_corner": 0.08758845925331116, "value_row": 0.10414545983076096, "value_any": 0.11905130743980408, "value_bot": 0.07334177196025848, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00027.png", "entropy": 1.3851048946380615} +{"ts": "2026-01-29T21:26:31.597513Z", "loop": 28, "env_steps": 17203200, "exact_value_avg": 0.10716836899518967, "regret_dist": 0.6966090202331543, "regret_other_env": 0.7105440497398376, "regret_corner": 0.6757063865661621, "regret_row": 0.6915906667709351, "regret_any": 0.7105440497398376, "regret_bot": 0.7241244316101074, "value_dist": 0.10716836899518967, "value_other_env": 0.11900904029607773, "value_corner": 0.08940735459327698, "value_row": 0.10509839653968811, "value_any": 0.11900904029607773, "value_bot": 0.07256462424993515, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00028.png", "entropy": 1.3849505186080933} +{"ts": "2026-01-29T21:26:32.799287Z", "loop": 29, "env_steps": 17817600, "exact_value_avg": 0.10791964083909988, "regret_dist": 0.6958577036857605, "regret_other_env": 0.7105910181999207, "regret_corner": 0.6737577319145203, "regret_row": 0.6905810236930847, "regret_any": 0.7105910181999207, "regret_bot": 0.7249384522438049, "value_dist": 0.10791964083909988, "value_other_env": 0.11896207183599472, "value_corner": 0.09135597944259644, "value_row": 0.10610806941986084, "value_any": 0.11896207183599472, "value_bot": 0.07175055891275406, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00029.png", "entropy": 1.3847769498825073} +{"ts": "2026-01-29T21:26:34.003398Z", "loop": 30, "env_steps": 18432000, "exact_value_avg": 0.10872451215982437, "regret_dist": 0.6950529217720032, "regret_other_env": 0.7106446623802185, "regret_corner": 0.6716652512550354, "regret_row": 0.6895212531089783, "regret_any": 0.7106446623802185, "regret_bot": 0.7257876992225647, "value_dist": 0.10872451215982437, "value_other_env": 0.11890847980976105, "value_corner": 0.09344854950904846, "value_row": 0.10716778039932251, "value_any": 0.11890847980976105, "value_bot": 0.07090133428573608, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00030.png", "entropy": 1.3845818042755127} +{"ts": "2026-01-29T21:26:35.208169Z", "loop": 31, "env_steps": 19046400, "exact_value_avg": 0.10959068685770035, "regret_dist": 0.6941866874694824, "regret_other_env": 0.710706889629364, "regret_corner": 0.6694062948226929, "regret_row": 0.6883974075317383, "regret_any": 0.710706889629364, "regret_bot": 0.7266824245452881, "value_dist": 0.10959068685770035, "value_other_env": 0.11884617805480957, "value_corner": 0.09570743888616562, "value_row": 0.10829156637191772, "value_any": 0.11884617805480957, "value_bot": 0.07000663876533508, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00031.png", "entropy": 1.3843610286712646} +{"ts": "2026-01-29T21:26:36.413283Z", "loop": 32, "env_steps": 19660800, "exact_value_avg": 0.11052142083644867, "regret_dist": 0.6932559013366699, "regret_other_env": 0.7107770442962646, "regret_corner": 0.6669741868972778, "regret_row": 0.6872072219848633, "regret_any": 0.7107770442962646, "regret_bot": 0.7276178598403931, "value_dist": 0.11052142083644867, "value_other_env": 0.11877600848674774, "value_corner": 0.09813951700925827, "value_row": 0.10948183387517929, "value_any": 0.11877600848674774, "value_bot": 0.06907123327255249, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00032.png", "entropy": 1.3841133117675781} +{"ts": "2026-01-29T21:26:37.617935Z", "loop": 33, "env_steps": 20275200, "exact_value_avg": 0.11151846498250961, "regret_dist": 0.6922589540481567, "regret_other_env": 0.710856020450592, "regret_corner": 0.6643632054328918, "regret_row": 0.6859562993049622, "regret_any": 0.710856020450592, "regret_bot": 0.7285887598991394, "value_dist": 0.11151846498250961, "value_other_env": 0.11869708448648453, "value_corner": 0.10075052827596664, "value_row": 0.11073276400566101, "value_any": 0.11869708448648453, "value_bot": 0.06810029596090317, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00033.png", "entropy": 1.3838356733322144} +{"ts": "2026-01-29T21:26:38.820086Z", "loop": 34, "env_steps": 20889600, "exact_value_avg": 0.11258533596992493, "regret_dist": 0.6911920309066772, "regret_other_env": 0.7109430432319641, "regret_corner": 0.6615654826164246, "regret_row": 0.6846542358398438, "regret_any": 0.7109430432319641, "regret_bot": 0.7295903563499451, "value_dist": 0.11258533596992493, "value_other_env": 0.11861006915569305, "value_corner": 0.10354822874069214, "value_row": 0.11203481256961823, "value_any": 0.11861006915569305, "value_bot": 0.06709868460893631, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00034.png", "entropy": 1.383526086807251} +{"ts": "2026-01-29T21:26:40.022859Z", "loop": 35, "env_steps": 21504000, "exact_value_avg": 0.113688163459301, "regret_dist": 0.690089225769043, "regret_other_env": 0.7110384106636047, "regret_corner": 0.6586653590202332, "regret_row": 0.6833341717720032, "regret_any": 0.7110384106636047, "regret_bot": 0.730596125125885, "value_dist": 0.113688163459301, "value_other_env": 0.11851465702056885, "value_corner": 0.10644841939210892, "value_row": 0.1133548840880394, "value_any": 0.11851465702056885, "value_bot": 0.06609293818473816, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00035.png", "entropy": 1.3831918239593506} +{"ts": "2026-01-29T21:26:41.227529Z", "loop": 36, "env_steps": 22118400, "exact_value_avg": 0.11486932635307312, "regret_dist": 0.6889081001281738, "regret_other_env": 0.7111445665359497, "regret_corner": 0.6555532813072205, "regret_row": 0.6819345951080322, "regret_any": 0.7111445665359497, "regret_bot": 0.7316409945487976, "value_dist": 0.11486932635307312, "value_other_env": 0.11840859055519104, "value_corner": 0.10956041514873505, "value_row": 0.11475446075201035, "value_any": 0.11840859055519104, "value_bot": 0.06504806131124496, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00036.png", "entropy": 1.3828192949295044} +{"ts": "2026-01-29T21:26:42.433001Z", "loop": 37, "env_steps": 22732800, "exact_value_avg": 0.11613787710666656, "regret_dist": 0.6876395344734192, "regret_other_env": 0.7112630605697632, "regret_corner": 0.6522042155265808, "regret_row": 0.68044114112854, "regret_any": 0.7112630605697632, "regret_bot": 0.7327359914779663, "value_dist": 0.11613787710666656, "value_other_env": 0.11829009652137756, "value_corner": 0.11290954053401947, "value_row": 0.11624793708324432, "value_any": 0.11829009652137756, "value_bot": 0.06395304948091507, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00037.png", "entropy": 1.3823999166488647} +{"ts": "2026-01-29T21:26:43.636700Z", "loop": 38, "env_steps": 23347200, "exact_value_avg": 0.1175159215927124, "regret_dist": 0.6862614154815674, "regret_other_env": 0.7113961577415466, "regret_corner": 0.6485593318939209, "regret_row": 0.6788301467895508, "regret_any": 0.7113961577415466, "regret_bot": 0.7338974475860596, "value_dist": 0.1175159215927124, "value_other_env": 0.11815696954727173, "value_corner": 0.11655434221029282, "value_row": 0.11785893887281418, "value_any": 0.11815696954727173, "value_bot": 0.06279159337282181, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00038.png", "entropy": 1.3819247484207153} +{"ts": "2026-01-29T21:26:44.838040Z", "loop": 39, "env_steps": 23961600, "exact_value_avg": 0.11901451647281647, "regret_dist": 0.6847628355026245, "regret_other_env": 0.7115461230278015, "regret_corner": 0.6445879340171814, "regret_row": 0.6771026253700256, "regret_any": 0.7115461230278015, "regret_bot": 0.7351263761520386, "value_dist": 0.11901451647281647, "value_other_env": 0.11800697445869446, "value_corner": 0.12052582949399948, "value_row": 0.11958643049001694, "value_any": 0.11800697445869446, "value_bot": 0.06156272068619728, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00039.png", "entropy": 1.381386160850525} +{"ts": "2026-01-29T21:26:46.040976Z", "loop": 40, "env_steps": 24576000, "exact_value_avg": 0.12063859403133392, "regret_dist": 0.6831387281417847, "regret_other_env": 0.7117156982421875, "regret_corner": 0.6402733325958252, "regret_row": 0.6752667427062988, "regret_any": 0.7117156982421875, "regret_bot": 0.7364131808280945, "value_dist": 0.12063859403133392, "value_other_env": 0.11783738434314728, "value_corner": 0.12484040856361389, "value_row": 0.12142232805490494, "value_any": 0.11783738434314728, "value_bot": 0.060275886207818985, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00040.png", "entropy": 1.380777359008789} +{"ts": "2026-01-29T21:26:47.243824Z", "loop": 41, "env_steps": 25190400, "exact_value_avg": 0.12239676713943481, "regret_dist": 0.6813806295394897, "regret_other_env": 0.7119086980819702, "regret_corner": 0.6355883479118347, "regret_row": 0.6733177900314331, "regret_any": 0.7119086980819702, "regret_bot": 0.7377517223358154, "value_dist": 0.12239676713943481, "value_other_env": 0.11764436960220337, "value_corner": 0.12952536344528198, "value_row": 0.12337127327919006, "value_any": 0.11764436960220337, "value_bot": 0.058937303721904755, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00041.png", "entropy": 1.3800876140594482} +{"ts": "2026-01-29T21:26:48.445155Z", "loop": 42, "env_steps": 25804800, "exact_value_avg": 0.12432008236646652, "regret_dist": 0.6794573068618774, "regret_other_env": 0.7121258974075317, "regret_corner": 0.630454421043396, "regret_row": 0.6712066531181335, "regret_any": 0.7121258974075317, "regret_bot": 0.7391718626022339, "value_dist": 0.12432008236646652, "value_other_env": 0.11742723733186722, "value_corner": 0.13465933501720428, "value_row": 0.1254824548959732, "value_any": 0.11742723733186722, "value_bot": 0.057517170906066895, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00042.png", "entropy": 1.3793009519577026} +{"ts": "2026-01-29T21:26:49.648640Z", "loop": 43, "env_steps": 26419200, "exact_value_avg": 0.12643879652023315, "regret_dist": 0.6773385405540466, "regret_other_env": 0.7123717069625854, "regret_corner": 0.6247888207435608, "regret_row": 0.668921709060669, "regret_any": 0.7123717069625854, "regret_bot": 0.7406740188598633, "value_dist": 0.12643879652023315, "value_other_env": 0.11718139797449112, "value_corner": 0.14032487571239471, "value_row": 0.12776732444763184, "value_any": 0.11718139797449112, "value_bot": 0.05601508170366287, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00043.png", "entropy": 1.3783979415893555} +{"ts": "2026-01-29T21:26:50.850577Z", "loop": 44, "env_steps": 27033600, "exact_value_avg": 0.12876269221305847, "regret_dist": 0.6750146746635437, "regret_other_env": 0.7126509547233582, "regret_corner": 0.6185601949691772, "regret_row": 0.6664764881134033, "regret_any": 0.7126509547233582, "regret_bot": 0.7422462701797485, "value_dist": 0.12876269221305847, "value_other_env": 0.11690212041139603, "value_corner": 0.14655353128910065, "value_row": 0.13021253049373627, "value_any": 0.11690212041139603, "value_bot": 0.054442815482616425, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00044.png", "entropy": 1.3773627281188965} +{"ts": "2026-01-29T21:26:52.051244Z", "loop": 45, "env_steps": 27648000, "exact_value_avg": 0.13129501044750214, "regret_dist": 0.6724823713302612, "regret_other_env": 0.7129663228988647, "regret_corner": 0.611756443977356, "regret_row": 0.6638903021812439, "regret_any": 0.7129663228988647, "regret_bot": 0.7438764572143555, "value_dist": 0.13129501044750214, "value_other_env": 0.11658678203821182, "value_corner": 0.1533573418855667, "value_row": 0.13279874622821808, "value_any": 0.11658678203821182, "value_bot": 0.052812591195106506, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00045.png", "entropy": 1.3761786222457886} +{"ts": "2026-01-29T21:26:53.254830Z", "loop": 46, "env_steps": 28262400, "exact_value_avg": 0.13406091928482056, "regret_dist": 0.669716477394104, "regret_other_env": 0.7133222222328186, "regret_corner": 0.6043078303337097, "regret_row": 0.661116898059845, "regret_any": 0.7133222222328186, "regret_bot": 0.7455779910087585, "value_dist": 0.13406091928482056, "value_other_env": 0.11623086780309677, "value_corner": 0.16080597043037415, "value_row": 0.1355721652507782, "value_any": 0.11623086780309677, "value_bot": 0.05111107602715492, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00046.png", "entropy": 1.3748263120651245} +{"ts": "2026-01-29T21:26:54.456976Z", "loop": 47, "env_steps": 28876800, "exact_value_avg": 0.13708607852458954, "regret_dist": 0.6666913032531738, "regret_other_env": 0.7137259840965271, "regret_corner": 0.5961391925811768, "regret_row": 0.6581237316131592, "regret_any": 0.7137259840965271, "regret_bot": 0.7473499178886414, "value_dist": 0.13708607852458954, "value_other_env": 0.11582710593938828, "value_corner": 0.16897453367710114, "value_row": 0.1385652720928192, "value_any": 0.11582710593938828, "value_bot": 0.04933909699320793, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00047.png", "entropy": 1.3732761144638062} +{"ts": "2026-01-29T21:26:55.660189Z", "loop": 48, "env_steps": 29491200, "exact_value_avg": 0.1403750777244568, "regret_dist": 0.6634023189544678, "regret_other_env": 0.7141807675361633, "regret_corner": 0.5872345566749573, "regret_row": 0.6549412608146667, "regret_any": 0.7141807675361633, "regret_bot": 0.7491788864135742, "value_dist": 0.1403750777244568, "value_other_env": 0.11537230759859085, "value_corner": 0.1778792142868042, "value_row": 0.14174778759479523, "value_any": 0.11537230759859085, "value_bot": 0.047510139644145966, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00048.png", "entropy": 1.371502161026001} +{"ts": "2026-01-29T21:26:56.864342Z", "loop": 49, "env_steps": 30105600, "exact_value_avg": 0.1439717411994934, "regret_dist": 0.6598055958747864, "regret_other_env": 0.7146974205970764, "regret_corner": 0.5774678587913513, "regret_row": 0.6515267491340637, "regret_any": 0.7146974205970764, "regret_bot": 0.7510849833488464, "value_dist": 0.1439717411994934, "value_other_env": 0.11485567688941956, "value_corner": 0.18764585256576538, "value_row": 0.14516231417655945, "value_any": 0.11485567688941956, "value_bot": 0.04560408741235733, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00049.png", "entropy": 1.369449257850647} +{"ts": "2026-01-29T21:26:58.066572Z", "loop": 50, "env_steps": 30720000, "exact_value_avg": 0.14790885150432587, "regret_dist": 0.6558685302734375, "regret_other_env": 0.7152825593948364, "regret_corner": 0.5667473673820496, "regret_row": 0.6478860378265381, "regret_any": 0.7152825593948364, "regret_bot": 0.7530576586723328, "value_dist": 0.14790885150432587, "value_other_env": 0.11427053064107895, "value_corner": 0.19836632907390594, "value_row": 0.14880304038524628, "value_any": 0.11427053064107895, "value_bot": 0.04363140091300011, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00050.png", "entropy": 1.3670694828033447} +{"ts": "2026-01-29T21:26:59.271708Z", "loop": 51, "env_steps": 31334400, "exact_value_avg": 0.15221160650253296, "regret_dist": 0.6515657901763916, "regret_other_env": 0.7159428596496582, "regret_corner": 0.5550000667572021, "regret_row": 0.6440491676330566, "regret_any": 0.7159428596496582, "regret_bot": 0.7550698518753052, "value_dist": 0.15221160650253296, "value_other_env": 0.11361023783683777, "value_corner": 0.21011365950107574, "value_row": 0.15263991057872772, "value_any": 0.11361023783683777, "value_bot": 0.041619133204221725, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00051.png", "entropy": 1.3643136024475098} +{"ts": "2026-01-29T21:27:00.473907Z", "loop": 52, "env_steps": 31948800, "exact_value_avg": 0.15688276290893555, "regret_dist": 0.646894633769989, "regret_other_env": 0.7166861295700073, "regret_corner": 0.5422073006629944, "regret_row": 0.6400160789489746, "regret_any": 0.7166861295700073, "regret_bot": 0.7571161389350891, "value_dist": 0.15688276290893555, "value_other_env": 0.11286698281764984, "value_corner": 0.2229064553976059, "value_row": 0.15667298436164856, "value_any": 0.11286698281764984, "value_bot": 0.039572905749082565, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00052.png", "entropy": 1.3611207008361816} +{"ts": "2026-01-29T21:27:01.675493Z", "loop": 53, "env_steps": 32563200, "exact_value_avg": 0.16195082664489746, "regret_dist": 0.6418265700340271, "regret_other_env": 0.7175223231315613, "regret_corner": 0.5282829403877258, "regret_row": 0.635780930519104, "regret_any": 0.7175223231315613, "regret_bot": 0.759194016456604, "value_dist": 0.16195082664489746, "value_other_env": 0.11203084141016006, "value_corner": 0.23683081567287445, "value_row": 0.16090813279151917, "value_any": 0.11203084141016006, "value_bot": 0.03749498352408409, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00053.png", "entropy": 1.3574124574661255} +{"ts": "2026-01-29T21:27:02.877973Z", "loop": 54, "env_steps": 33177600, "exact_value_avg": 0.16744202375411987, "regret_dist": 0.6363353729248047, "regret_other_env": 0.7184621691703796, "regret_corner": 0.5131450295448303, "regret_row": 0.6313928365707397, "regret_any": 0.7184621691703796, "regret_bot": 0.7612881660461426, "value_dist": 0.16744202375411987, "value_other_env": 0.11109088361263275, "value_corner": 0.25196871161460876, "value_row": 0.16529622673988342, "value_any": 0.11109088361263275, "value_bot": 0.035400912165641785, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00054.png", "entropy": 1.3530875444412231} +{"ts": "2026-01-29T21:27:04.083290Z", "loop": 55, "env_steps": 33792000, "exact_value_avg": 0.17331275343894958, "regret_dist": 0.6304646730422974, "regret_other_env": 0.7195010185241699, "regret_corner": 0.49691006541252136, "regret_row": 0.6268599033355713, "regret_any": 0.7195010185241699, "regret_bot": 0.7633769512176514, "value_dist": 0.17331275343894958, "value_other_env": 0.11005213856697083, "value_corner": 0.2682036757469177, "value_row": 0.1698291003704071, "value_any": 0.11005213856697083, "value_bot": 0.0333121083676815, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00055.png", "entropy": 1.348099708557129} +{"ts": "2026-01-29T21:27:05.286178Z", "loop": 56, "env_steps": 34406400, "exact_value_avg": 0.17955590784549713, "regret_dist": 0.6242214441299438, "regret_other_env": 0.7206491827964783, "regret_corner": 0.4795798063278198, "regret_row": 0.6222306489944458, "regret_any": 0.7206491827964783, "regret_bot": 0.7654501795768738, "value_dist": 0.17955590784549713, "value_other_env": 0.1089039072394371, "value_corner": 0.2855339050292969, "value_row": 0.17445839941501617, "value_any": 0.1089039072394371, "value_bot": 0.031238898634910583, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00056.png", "entropy": 1.3423306941986084} +{"ts": "2026-01-29T21:27:06.488370Z", "loop": 57, "env_steps": 35020800, "exact_value_avg": 0.18613389134407043, "regret_dist": 0.6176434755325317, "regret_other_env": 0.7219075560569763, "regret_corner": 0.4612472951412201, "regret_row": 0.6175563931465149, "regret_any": 0.7219075560569763, "regret_bot": 0.7674852013587952, "value_dist": 0.18613389134407043, "value_other_env": 0.10764554888010025, "value_corner": 0.3038664162158966, "value_row": 0.1791326254606247, "value_any": 0.10764554888010025, "value_bot": 0.029203882440924644, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00057.png", "entropy": 1.335676908493042} +{"ts": "2026-01-29T21:27:07.689996Z", "loop": 58, "env_steps": 35635200, "exact_value_avg": 0.19305890798568726, "regret_dist": 0.6107183694839478, "regret_other_env": 0.7232885956764221, "regret_corner": 0.441863089799881, "regret_row": 0.6128413081169128, "regret_any": 0.7232885956764221, "regret_bot": 0.7694716453552246, "value_dist": 0.19305890798568726, "value_other_env": 0.10626442730426788, "value_corner": 0.3232506215572357, "value_row": 0.18384778499603271, "value_any": 0.10626442730426788, "value_bot": 0.027217388153076172, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00058.png", "entropy": 1.3279414176940918} +{"ts": "2026-01-29T21:27:08.895199Z", "loop": 59, "env_steps": 36249600, "exact_value_avg": 0.20027294754981995, "regret_dist": 0.6035044193267822, "regret_other_env": 0.7247923612594604, "regret_corner": 0.4215725064277649, "regret_row": 0.6081446409225464, "regret_any": 0.7247923612594604, "regret_bot": 0.7714048027992249, "value_dist": 0.20027294754981995, "value_other_env": 0.10476073622703552, "value_corner": 0.3435412347316742, "value_row": 0.18854445219039917, "value_any": 0.10476073622703552, "value_bot": 0.02528422325849533, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00059.png", "entropy": 1.3189697265625} +{"ts": "2026-01-29T21:27:10.099374Z", "loop": 60, "env_steps": 36864000, "exact_value_avg": 0.20769551396369934, "regret_dist": 0.5960818529129028, "regret_other_env": 0.7264055013656616, "regret_corner": 0.40059638023376465, "regret_row": 0.6035776138305664, "regret_any": 0.7264055013656616, "regret_bot": 0.7732534408569336, "value_dist": 0.20769551396369934, "value_other_env": 0.10314761102199554, "value_corner": 0.36451736092567444, "value_row": 0.19311143457889557, "value_any": 0.10314761102199554, "value_bot": 0.023435605689883232, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00060.png", "entropy": 1.308637022972107} +{"ts": "2026-01-29T21:27:11.302073Z", "loop": 61, "env_steps": 37478400, "exact_value_avg": 0.21522243320941925, "regret_dist": 0.5885549783706665, "regret_other_env": 0.7281160950660706, "regret_corner": 0.3792131841182709, "regret_row": 0.5991471409797668, "regret_any": 0.7281160950660706, "regret_bot": 0.7750135064125061, "value_dist": 0.21522243320941925, "value_other_env": 0.10143701732158661, "value_corner": 0.3859005272388458, "value_row": 0.19754184782505035, "value_any": 0.10143701732158661, "value_bot": 0.02167559415102005, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00061.png", "entropy": 1.2968136072158813} +{"ts": "2026-01-29T21:27:12.503905Z", "loop": 62, "env_steps": 38092800, "exact_value_avg": 0.22280213236808777, "regret_dist": 0.5809752941131592, "regret_other_env": 0.7299229502677917, "regret_corner": 0.35755378007888794, "regret_row": 0.5948530435562134, "regret_any": 0.7299229502677917, "regret_bot": 0.7766905426979065, "value_dist": 0.22280213236808777, "value_other_env": 0.0996302142739296, "value_corner": 0.40755996108055115, "value_row": 0.2018360197544098, "value_any": 0.0996302142739296, "value_bot": 0.01999850757420063, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00062.png", "entropy": 1.2832804918289185} +{"ts": "2026-01-29T21:27:13.708153Z", "loop": 63, "env_steps": 38707200, "exact_value_avg": 0.2303006798028946, "regret_dist": 0.5734766721725464, "regret_other_env": 0.7317994832992554, "regret_corner": 0.3359924256801605, "regret_row": 0.5907350182533264, "regret_any": 0.7317994832992554, "regret_bot": 0.7782753705978394, "value_dist": 0.2303006798028946, "value_other_env": 0.09775357693433762, "value_corner": 0.42912131547927856, "value_row": 0.20595401525497437, "value_any": 0.09775357693433762, "value_bot": 0.018413782119750977, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00063.png", "entropy": 1.2679650783538818} +{"ts": "2026-01-29T21:27:14.912291Z", "loop": 64, "env_steps": 39321600, "exact_value_avg": 0.23768483102321625, "regret_dist": 0.5660926103591919, "regret_other_env": 0.7337440848350525, "regret_corner": 0.31461527943611145, "regret_row": 0.5868507623672485, "regret_any": 0.7337440848350525, "regret_bot": 0.7797617316246033, "value_dist": 0.23768483102321625, "value_other_env": 0.09580904990434647, "value_corner": 0.45049849152565, "value_row": 0.20983830094337463, "value_any": 0.09580904990434647, "value_bot": 0.016927294433116913, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00064.png", "entropy": 1.2506767511367798} +{"ts": "2026-01-29T21:27:16.114738Z", "loop": 65, "env_steps": 39936000, "exact_value_avg": 0.24484242498874664, "regret_dist": 0.5589349269866943, "regret_other_env": 0.7357228994369507, "regret_corner": 0.2937529385089874, "regret_row": 0.5832030773162842, "regret_any": 0.7357228994369507, "regret_bot": 0.7811429500579834, "value_dist": 0.24484242498874664, "value_other_env": 0.0938301756978035, "value_corner": 0.47136080265045166, "value_row": 0.21348589658737183, "value_any": 0.0938301756978035, "value_bot": 0.015546104870736599, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00065.png", "entropy": 1.2313936948776245} +{"ts": "2026-01-29T21:27:17.318455Z", "loop": 66, "env_steps": 40550400, "exact_value_avg": 0.25170275568962097, "regret_dist": 0.552074670791626, "regret_other_env": 0.7377173900604248, "regret_corner": 0.27361050248146057, "regret_row": 0.5798970460891724, "regret_any": 0.7377173900604248, "regret_bot": 0.7824063301086426, "value_dist": 0.25170275568962097, "value_other_env": 0.09183574467897415, "value_corner": 0.4915032386779785, "value_row": 0.21679197251796722, "value_any": 0.09183574467897415, "value_bot": 0.01428270898759365, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00066.png", "entropy": 1.2100635766983032} +{"ts": "2026-01-29T21:27:18.521941Z", "loop": 67, "env_steps": 41164800, "exact_value_avg": 0.2581457197666168, "regret_dist": 0.5456316471099854, "regret_other_env": 0.7396870851516724, "regret_corner": 0.25454843044281006, "regret_row": 0.5769563913345337, "regret_any": 0.7396870851516724, "regret_bot": 0.7835448980331421, "value_dist": 0.2581457197666168, "value_other_env": 0.08986601233482361, "value_corner": 0.5105652809143066, "value_row": 0.21973268687725067, "value_any": 0.08986601233482361, "value_bot": 0.01314407680183649, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00067.png", "entropy": 1.1868995428085327} +{"ts": "2026-01-29T21:27:19.724576Z", "loop": 68, "env_steps": 41779200, "exact_value_avg": 0.26411503553390503, "regret_dist": 0.5396623611450195, "regret_other_env": 0.741592526435852, "regret_corner": 0.23676705360412598, "regret_row": 0.5745529532432556, "regret_any": 0.741592526435852, "regret_bot": 0.7845375537872314, "value_dist": 0.26411503553390503, "value_other_env": 0.08796059340238571, "value_corner": 0.5283467173576355, "value_row": 0.22213611006736755, "value_any": 0.08796059340238571, "value_bot": 0.012151464819908142, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00068.png", "entropy": 1.1623321771621704} +{"ts": "2026-01-29T21:27:20.929819Z", "loop": 69, "env_steps": 42393600, "exact_value_avg": 0.26959070563316345, "regret_dist": 0.5341866612434387, "regret_other_env": 0.7434213161468506, "regret_corner": 0.22033463418483734, "regret_row": 0.5724998116493225, "regret_any": 0.7434213161468506, "regret_bot": 0.785417377948761, "value_dist": 0.26959070563316345, "value_other_env": 0.08613176643848419, "value_corner": 0.5447791218757629, "value_row": 0.22418926656246185, "value_any": 0.08613176643848419, "value_bot": 0.011271635070443153, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00069.png", "entropy": 1.1364877223968506} +{"ts": "2026-01-29T21:27:22.136806Z", "loop": 70, "env_steps": 43008000, "exact_value_avg": 0.2746220529079437, "regret_dist": 0.5291553735733032, "regret_other_env": 0.7451717853546143, "regret_corner": 0.2051306813955307, "regret_row": 0.5708040595054626, "regret_any": 0.7451717853546143, "regret_bot": 0.7861950993537903, "value_dist": 0.2746220529079437, "value_other_env": 0.08438136428594589, "value_corner": 0.5599830746650696, "value_row": 0.22588500380516052, "value_any": 0.08438136428594589, "value_bot": 0.01049390621483326, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00070.png", "entropy": 1.1094565391540527} +{"ts": "2026-01-29T21:27:23.339339Z", "loop": 71, "env_steps": 43622400, "exact_value_avg": 0.27914848923683167, "regret_dist": 0.5246288776397705, "regret_other_env": 0.7467987537384033, "regret_corner": 0.1913740187883377, "regret_row": 0.5696164965629578, "regret_any": 0.7467987537384033, "regret_bot": 0.7868531942367554, "value_dist": 0.27914848923683167, "value_other_env": 0.08275434374809265, "value_corner": 0.5737397074699402, "value_row": 0.22707252204418182, "value_any": 0.08275434374809265, "value_bot": 0.009835819713771343, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00071.png", "entropy": 1.0821216106414795} +{"ts": "2026-01-29T21:27:24.543996Z", "loop": 72, "env_steps": 44236800, "exact_value_avg": 0.28318485617637634, "regret_dist": 0.5205925107002258, "regret_other_env": 0.7483152151107788, "regret_corner": 0.17900840938091278, "regret_row": 0.5686254501342773, "regret_any": 0.7483152151107788, "regret_bot": 0.7874355912208557, "value_dist": 0.28318485617637634, "value_other_env": 0.08123791962862015, "value_corner": 0.5861052870750427, "value_row": 0.22806358337402344, "value_any": 0.08123791962862015, "value_bot": 0.009253399446606636, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00072.png", "entropy": 1.0544239282608032} +{"ts": "2026-01-29T21:27:25.750089Z", "loop": 73, "env_steps": 44851200, "exact_value_avg": 0.2867906093597412, "regret_dist": 0.5169867277145386, "regret_other_env": 0.7497034668922424, "regret_corner": 0.1679116189479828, "regret_row": 0.5680332183837891, "regret_any": 0.7497034668922424, "regret_bot": 0.7879255414009094, "value_dist": 0.2867906093597412, "value_other_env": 0.07984956353902817, "value_corner": 0.5972021222114563, "value_row": 0.2286558896303177, "value_any": 0.07984956353902817, "value_bot": 0.00876341387629509, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00073.png", "entropy": 1.0270819664001465} +{"ts": "2026-01-29T21:27:26.952988Z", "loop": 74, "env_steps": 45465600, "exact_value_avg": 0.2899884581565857, "regret_dist": 0.5137888789176941, "regret_other_env": 0.7509744167327881, "regret_corner": 0.1580105572938919, "regret_row": 0.5676447153091431, "regret_any": 0.7509744167327881, "regret_bot": 0.7883505821228027, "value_dist": 0.2899884581565857, "value_other_env": 0.0785786435008049, "value_corner": 0.607103168964386, "value_row": 0.2290443629026413, "value_any": 0.0785786435008049, "value_bot": 0.0083384457975626, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00074.png", "entropy": 1.0001219511032104} +{"ts": "2026-01-29T21:27:28.158552Z", "loop": 75, "env_steps": 46080000, "exact_value_avg": 0.2927948236465454, "regret_dist": 0.5109825730323792, "regret_other_env": 0.752132773399353, "regret_corner": 0.14925719797611237, "regret_row": 0.5674065947532654, "regret_any": 0.752132773399353, "regret_bot": 0.7887212038040161, "value_dist": 0.2927948236465454, "value_other_env": 0.07742032408714294, "value_corner": 0.6158565878868103, "value_row": 0.2292824387550354, "value_any": 0.07742032408714294, "value_bot": 0.007967823185026646, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00075.png", "entropy": 0.9737964272499084} +{"ts": "2026-01-29T21:27:29.363624Z", "loop": 76, "env_steps": 46694400, "exact_value_avg": 0.29526764154434204, "regret_dist": 0.5085097551345825, "regret_other_env": 0.7531638145446777, "regret_corner": 0.1415286362171173, "regret_row": 0.5676336884498596, "regret_any": 0.7531638145446777, "regret_bot": 0.7890110611915588, "value_dist": 0.29526764154434204, "value_other_env": 0.07638932019472122, "value_corner": 0.6235851049423218, "value_row": 0.22905534505844116, "value_any": 0.07638932019472122, "value_bot": 0.00767802819609642, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00076.png", "entropy": 0.9490031599998474} +{"ts": "2026-01-29T21:27:30.567021Z", "loop": 77, "env_steps": 47308800, "exact_value_avg": 0.2974741458892822, "regret_dist": 0.5063032507896423, "regret_other_env": 0.7540866732597351, "regret_corner": 0.13462801277637482, "regret_row": 0.5682156085968018, "regret_any": 0.7540866732597351, "regret_bot": 0.7892414927482605, "value_dist": 0.2974741458892822, "value_other_env": 0.07546642422676086, "value_corner": 0.6304857134819031, "value_row": 0.2284734547138214, "value_any": 0.07546642422676086, "value_bot": 0.007447476498782635, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00077.png", "entropy": 0.9255740642547607} +{"ts": "2026-01-29T21:27:31.771203Z", "loop": 78, "env_steps": 47923200, "exact_value_avg": 0.29939180612564087, "regret_dist": 0.5043855905532837, "regret_other_env": 0.7548925280570984, "regret_corner": 0.12862513959407806, "regret_row": 0.5691400170326233, "regret_any": 0.7548925280570984, "regret_bot": 0.789411187171936, "value_dist": 0.29939180612564087, "value_other_env": 0.07466059178113937, "value_corner": 0.6364886164665222, "value_row": 0.22754906117916107, "value_any": 0.07466059178113937, "value_bot": 0.007277801167219877, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00078.png", "entropy": 0.9041509628295898} +{"ts": "2026-01-29T21:27:32.975244Z", "loop": 79, "env_steps": 48537600, "exact_value_avg": 0.301079124212265, "regret_dist": 0.5026982426643372, "regret_other_env": 0.7555983066558838, "regret_corner": 0.12334813177585602, "regret_row": 0.5704201459884644, "regret_any": 0.7555983066558838, "regret_bot": 0.7895265221595764, "value_dist": 0.301079124212265, "value_other_env": 0.07395476847887039, "value_corner": 0.6417656540870667, "value_row": 0.2262689471244812, "value_any": 0.07395476847887039, "value_bot": 0.007162508554756641, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00079.png", "entropy": 0.8846181035041809} +{"ts": "2026-01-29T21:27:34.179882Z", "loop": 80, "env_steps": 49152000, "exact_value_avg": 0.3025747537612915, "regret_dist": 0.5012025833129883, "regret_other_env": 0.7562212347984314, "regret_corner": 0.1186746284365654, "regret_row": 0.5720959901809692, "regret_any": 0.7562212347984314, "regret_bot": 0.7895890474319458, "value_dist": 0.3025747537612915, "value_other_env": 0.073331817984581, "value_corner": 0.6464391350746155, "value_row": 0.22459302842617035, "value_any": 0.073331817984581, "value_bot": 0.007100082468241453, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00080.png", "entropy": 0.8668220639228821} +{"ts": "2026-01-29T21:27:35.418634Z", "loop": 81, "env_steps": 49766400, "exact_value_avg": 0.3038904666900635, "regret_dist": 0.4998868703842163, "regret_other_env": 0.7567827701568604, "regret_corner": 0.11454299092292786, "regret_row": 0.5740786194801331, "regret_any": 0.7567827701568604, "regret_bot": 0.7896138429641724, "value_dist": 0.3038904666900635, "value_other_env": 0.07277031987905502, "value_corner": 0.6505706906318665, "value_row": 0.22261039912700653, "value_any": 0.07277031987905502, "value_bot": 0.0070752594619989395, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00081.png", "entropy": 0.8503040671348572} +{"ts": "2026-01-29T21:27:36.622422Z", "loop": 82, "env_steps": 50380800, "exact_value_avg": 0.30503636598587036, "regret_dist": 0.4987410008907318, "regret_other_env": 0.7572895884513855, "regret_corner": 0.1109180599451065, "regret_row": 0.5763017535209656, "regret_any": 0.7572895884513855, "regret_bot": 0.7896057963371277, "value_dist": 0.30503636598587036, "value_other_env": 0.07226349413394928, "value_corner": 0.6541956663131714, "value_row": 0.2203873097896576, "value_any": 0.07226349413394928, "value_bot": 0.007083241827785969, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00082.png", "entropy": 0.8350101709365845} +{"ts": "2026-01-29T21:27:37.829500Z", "loop": 83, "env_steps": 50995200, "exact_value_avg": 0.30599337816238403, "regret_dist": 0.49778398871421814, "regret_other_env": 0.7577361464500427, "regret_corner": 0.10785572975873947, "regret_row": 0.5788238048553467, "regret_any": 0.7577361464500427, "regret_bot": 0.7895601987838745, "value_dist": 0.30599337816238403, "value_other_env": 0.07181695848703384, "value_corner": 0.6572580337524414, "value_row": 0.2178652584552765, "value_any": 0.07181695848703384, "value_bot": 0.007128826342523098, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00083.png", "entropy": 0.8212588429450989} +{"ts": "2026-01-29T21:27:39.032202Z", "loop": 84, "env_steps": 51609600, "exact_value_avg": 0.3067586421966553, "regret_dist": 0.4970187544822693, "regret_other_env": 0.7581304907798767, "regret_corner": 0.10535112023353577, "regret_row": 0.5812982320785522, "regret_any": 0.7581304907798767, "regret_bot": 0.7895017266273499, "value_dist": 0.3067586421966553, "value_other_env": 0.07142266631126404, "value_corner": 0.6597626209259033, "value_row": 0.21539078652858734, "value_any": 0.07142266631126404, "value_bot": 0.007187272422015667, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00084.png", "entropy": 0.808853030204773} +{"ts": "2026-01-29T21:27:40.242964Z", "loop": 85, "env_steps": 52224000, "exact_value_avg": 0.30734241008758545, "regret_dist": 0.4964349865913391, "regret_other_env": 0.7584669589996338, "regret_corner": 0.10338699817657471, "regret_row": 0.5838974714279175, "regret_any": 0.7584669589996338, "regret_bot": 0.7894142866134644, "value_dist": 0.30734241008758545, "value_other_env": 0.07108616083860397, "value_corner": 0.661726713180542, "value_row": 0.2127915769815445, "value_any": 0.07108616083860397, "value_bot": 0.007274738512933254, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00085.png", "entropy": 0.7980553507804871} +{"ts": "2026-01-29T21:27:41.446500Z", "loop": 86, "env_steps": 52838400, "exact_value_avg": 0.3077804744243622, "regret_dist": 0.49599689245224, "regret_other_env": 0.7587647438049316, "regret_corner": 0.10184504091739655, "regret_row": 0.5864700675010681, "regret_any": 0.7587647438049316, "regret_bot": 0.7893165946006775, "value_dist": 0.3077804744243622, "value_other_env": 0.07078832387924194, "value_corner": 0.6632686853408813, "value_row": 0.21021901071071625, "value_any": 0.07078832387924194, "value_bot": 0.007372410036623478, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00086.png", "entropy": 0.7883017063140869} +{"ts": "2026-01-29T21:27:42.649644Z", "loop": 87, "env_steps": 53452800, "exact_value_avg": 0.30808180570602417, "regret_dist": 0.49569565057754517, "regret_other_env": 0.7590317726135254, "regret_corner": 0.10069142282009125, "regret_row": 0.5891507267951965, "regret_any": 0.7590317726135254, "regret_bot": 0.7891967296600342, "value_dist": 0.30808180570602417, "value_other_env": 0.07052140682935715, "value_corner": 0.664422333240509, "value_row": 0.20753832161426544, "value_any": 0.07052140682935715, "value_bot": 0.007492367178201675, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00087.png", "entropy": 0.7794496417045593} +{"ts": "2026-01-29T21:27:43.852254Z", "loop": 88, "env_steps": 54067200, "exact_value_avg": 0.3082308769226074, "regret_dist": 0.4955465495586395, "regret_other_env": 0.759279191493988, "regret_corner": 0.0999474972486496, "regret_row": 0.5921661853790283, "regret_any": 0.759279191493988, "regret_bot": 0.7890408635139465, "value_dist": 0.3082308769226074, "value_other_env": 0.07027389854192734, "value_corner": 0.6651662588119507, "value_row": 0.20452290773391724, "value_any": 0.07027389854192734, "value_bot": 0.007648172788321972, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00088.png", "entropy": 0.7711803913116455} +{"ts": "2026-01-29T21:27:45.056790Z", "loop": 89, "env_steps": 54681600, "exact_value_avg": 0.3083708882331848, "regret_dist": 0.49540647864341736, "regret_other_env": 0.7594872117042542, "regret_corner": 0.09928534179925919, "regret_row": 0.5940138697624207, "regret_any": 0.7594872117042542, "regret_bot": 0.7889639139175415, "value_dist": 0.3083708882331848, "value_other_env": 0.07006587833166122, "value_corner": 0.6658283472061157, "value_row": 0.20267517864704132, "value_any": 0.07006587833166122, "value_bot": 0.007725169416517019, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00089.png", "entropy": 0.7639880776405334} +{"ts": "2026-01-29T21:27:46.263003Z", "loop": 90, "env_steps": 55296000, "exact_value_avg": 0.30856841802597046, "regret_dist": 0.4952089488506317, "regret_other_env": 0.7596715092658997, "regret_corner": 0.098515085875988, "regret_row": 0.5948960781097412, "regret_any": 0.7596715092658997, "regret_bot": 0.7889578938484192, "value_dist": 0.30856841802597046, "value_other_env": 0.06988158077001572, "value_corner": 0.6665986776351929, "value_row": 0.20179301500320435, "value_any": 0.06988158077001572, "value_bot": 0.007731173187494278, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00090.png", "entropy": 0.7574840188026428} +{"ts": "2026-01-29T21:27:47.466115Z", "loop": 91, "env_steps": 55910400, "exact_value_avg": 0.3088020980358124, "regret_dist": 0.4949752688407898, "regret_other_env": 0.7598226070404053, "regret_corner": 0.0977041944861412, "regret_row": 0.5949969291687012, "regret_any": 0.7598226070404053, "regret_bot": 0.789004385471344, "value_dist": 0.3088020980358124, "value_other_env": 0.0697304755449295, "value_corner": 0.6674095392227173, "value_row": 0.2016921490430832, "value_any": 0.0697304755449295, "value_bot": 0.007684743497520685, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00091.png", "entropy": 0.751971960067749} +{"ts": "2026-01-29T21:27:48.671434Z", "loop": 92, "env_steps": 56524800, "exact_value_avg": 0.3090873062610626, "regret_dist": 0.49469006061553955, "regret_other_env": 0.7599467039108276, "regret_corner": 0.09680501371622086, "regret_row": 0.5942338109016418, "regret_any": 0.7599467039108276, "regret_bot": 0.789110541343689, "value_dist": 0.3090873062610626, "value_other_env": 0.06960637122392654, "value_corner": 0.6683087348937988, "value_row": 0.20245520770549774, "value_any": 0.06960637122392654, "value_bot": 0.0075784530490636826, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00092.png", "entropy": 0.7473070621490479} +{"ts": "2026-01-29T21:27:49.884567Z", "loop": 93, "env_steps": 57139200, "exact_value_avg": 0.30939048528671265, "regret_dist": 0.4943869113922119, "regret_other_env": 0.7600467801094055, "regret_corner": 0.09589707851409912, "regret_row": 0.5928019881248474, "regret_any": 0.7600467801094055, "regret_bot": 0.7892610430717468, "value_dist": 0.30939048528671265, "value_other_env": 0.06950633227825165, "value_corner": 0.6692166924476624, "value_row": 0.20388703048229218, "value_any": 0.06950633227825165, "value_bot": 0.007428058423101902, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00093.png", "entropy": 0.7434462904930115} +{"ts": "2026-01-29T21:27:51.090562Z", "loop": 94, "env_steps": 57753600, "exact_value_avg": 0.3096752166748047, "regret_dist": 0.4941021203994751, "regret_other_env": 0.7601311206817627, "regret_corner": 0.09505860507488251, "regret_row": 0.590729832649231, "regret_any": 0.7601311206817627, "regret_bot": 0.7894505262374878, "value_dist": 0.3096752166748047, "value_other_env": 0.06942193955183029, "value_corner": 0.6700551509857178, "value_row": 0.205959290266037, "value_any": 0.06942193955183029, "value_bot": 0.00723855197429657, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00094.png", "entropy": 0.7401105165481567} +{"ts": "2026-01-29T21:27:52.294572Z", "loop": 95, "env_steps": 58368000, "exact_value_avg": 0.3098859488964081, "regret_dist": 0.4938914179801941, "regret_other_env": 0.7602070569992065, "regret_corner": 0.09441794455051422, "regret_row": 0.5887377858161926, "regret_any": 0.7602070569992065, "regret_bot": 0.7896251082420349, "value_dist": 0.3098859488964081, "value_other_env": 0.06934602558612823, "value_corner": 0.6706957817077637, "value_row": 0.20795126259326935, "value_any": 0.06934602558612823, "value_bot": 0.007063896395266056, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00095.png", "entropy": 0.7370206713676453} +{"ts": "2026-01-29T21:27:53.500308Z", "loop": 96, "env_steps": 58982400, "exact_value_avg": 0.31003162264823914, "regret_dist": 0.4937458038330078, "regret_other_env": 0.7602706551551819, "regret_corner": 0.09395844489336014, "regret_row": 0.5857909917831421, "regret_any": 0.7602706551551819, "regret_bot": 0.7898590564727783, "value_dist": 0.31003162264823914, "value_other_env": 0.06928244233131409, "value_corner": 0.6711553335189819, "value_row": 0.2108980268239975, "value_any": 0.06928244233131409, "value_bot": 0.006829879246652126, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00096.png", "entropy": 0.7342857122421265} +{"ts": "2026-01-29T21:27:54.703286Z", "loop": 97, "env_steps": 59596800, "exact_value_avg": 0.3100450336933136, "regret_dist": 0.49373236298561096, "regret_other_env": 0.7603344917297363, "regret_corner": 0.09382911771535873, "regret_row": 0.5822581052780151, "regret_any": 0.7603344917297363, "regret_bot": 0.7901246547698975, "value_dist": 0.3100450336933136, "value_other_env": 0.06921855360269547, "value_corner": 0.6712846755981445, "value_row": 0.21443094313144684, "value_any": 0.06921855360269547, "value_bot": 0.006564426235854626, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00097.png", "entropy": 0.7314297556877136} +{"ts": "2026-01-29T21:27:55.907615Z", "loop": 98, "env_steps": 60211200, "exact_value_avg": 0.3099119961261749, "regret_dist": 0.49386537075042725, "regret_other_env": 0.7604028582572937, "regret_corner": 0.09405914694070816, "regret_row": 0.5788333415985107, "regret_any": 0.7604028582572937, "regret_bot": 0.7903719544410706, "value_dist": 0.3099119961261749, "value_other_env": 0.06915026903152466, "value_corner": 0.6710545420646667, "value_row": 0.21785566210746765, "value_any": 0.06915026903152466, "value_bot": 0.006317040417343378, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00098.png", "entropy": 0.7283978462219238} +{"ts": "2026-01-29T21:27:57.112856Z", "loop": 99, "env_steps": 60825600, "exact_value_avg": 0.3097144663333893, "regret_dist": 0.4940629303455353, "regret_other_env": 0.7604769468307495, "regret_corner": 0.09444186091423035, "regret_row": 0.5760840177536011, "regret_any": 0.7604769468307495, "regret_bot": 0.7905681133270264, "value_dist": 0.3097144663333893, "value_other_env": 0.06907617300748825, "value_corner": 0.6706718802452087, "value_row": 0.2206050157546997, "value_any": 0.06907617300748825, "value_bot": 0.006120986305177212, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00099.png", "entropy": 0.7252113223075867} +{"ts": "2026-01-29T21:27:58.315872Z", "loop": 100, "env_steps": 61440000, "exact_value_avg": 0.30950337648391724, "regret_dist": 0.4942740201950073, "regret_other_env": 0.7605493068695068, "regret_corner": 0.09486103057861328, "regret_row": 0.573904275894165, "regret_any": 0.7605493068695068, "regret_bot": 0.7907244563102722, "value_dist": 0.30950337648391724, "value_other_env": 0.06900373846292496, "value_corner": 0.670252799987793, "value_row": 0.22278481721878052, "value_any": 0.06900373846292496, "value_bot": 0.005964657757431269, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00100.png", "entropy": 0.7221852540969849} +{"ts": "2026-01-29T21:27:59.519888Z", "loop": 101, "env_steps": 62054400, "exact_value_avg": 0.3094632029533386, "regret_dist": 0.49431419372558594, "regret_other_env": 0.7606005668640137, "regret_corner": 0.09488456696271896, "regret_row": 0.5732777714729309, "regret_any": 0.7606005668640137, "regret_bot": 0.7907774448394775, "value_dist": 0.3094632029533386, "value_other_env": 0.0689525380730629, "value_corner": 0.6702291965484619, "value_row": 0.22341132164001465, "value_any": 0.0689525380730629, "value_bot": 0.005911593791097403, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00101.png", "entropy": 0.7202247977256775} +{"ts": "2026-01-29T21:28:00.725127Z", "loop": 102, "env_steps": 62668800, "exact_value_avg": 0.30960315465927124, "regret_dist": 0.4941742420196533, "regret_other_env": 0.7606302499771118, "regret_corner": 0.09449020028114319, "regret_row": 0.5739896893501282, "regret_any": 0.7606302499771118, "regret_bot": 0.7907423377037048, "value_dist": 0.30960315465927124, "value_other_env": 0.06892289221286774, "value_corner": 0.6706235408782959, "value_row": 0.2226993888616562, "value_any": 0.06892289221286774, "value_bot": 0.005946754477918148, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00102.png", "entropy": 0.7192450165748596} +{"ts": "2026-01-29T21:28:01.933131Z", "loop": 103, "env_steps": 63283200, "exact_value_avg": 0.3098222017288208, "regret_dist": 0.49395516514778137, "regret_other_env": 0.7606467008590698, "regret_corner": 0.09391786903142929, "regret_row": 0.575514018535614, "regret_any": 0.7606467008590698, "regret_bot": 0.7906511425971985, "value_dist": 0.3098222017288208, "value_other_env": 0.06890637427568436, "value_corner": 0.6711958646774292, "value_row": 0.22117502987384796, "value_any": 0.06890637427568436, "value_bot": 0.00603797473013401, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00103.png", "entropy": 0.7189529538154602} +{"ts": "2026-01-29T21:28:03.141240Z", "loop": 104, "env_steps": 63897600, "exact_value_avg": 0.3100588321685791, "regret_dist": 0.49371856451034546, "regret_other_env": 0.7606549859046936, "regret_corner": 0.09331389516592026, "regret_row": 0.5774969458580017, "regret_any": 0.7606549859046936, "regret_bot": 0.7905271053314209, "value_dist": 0.3100588321685791, "value_other_env": 0.06889813393354416, "value_corner": 0.6717998385429382, "value_row": 0.21919213235378265, "value_any": 0.06889813393354416, "value_bot": 0.006161893252283335, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00104.png", "entropy": 0.7189707159996033} +{"ts": "2026-01-29T21:28:04.344586Z", "loop": 105, "env_steps": 64512000, "exact_value_avg": 0.3102911114692688, "regret_dist": 0.493486225605011, "regret_other_env": 0.7606579661369324, "regret_corner": 0.09272858500480652, "regret_row": 0.5801388621330261, "regret_any": 0.7606579661369324, "regret_bot": 0.7903568148612976, "value_dist": 0.3102911114692688, "value_other_env": 0.0688951313495636, "value_corner": 0.6723850965499878, "value_row": 0.21655015647411346, "value_any": 0.0688951313495636, "value_bot": 0.00633222097530961, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00105.png", "entropy": 0.719210684299469} +{"ts": "2026-01-29T21:28:05.546890Z", "loop": 106, "env_steps": 65126400, "exact_value_avg": 0.31047120690345764, "regret_dist": 0.49330615997314453, "regret_other_env": 0.7606629729270935, "regret_corner": 0.09227091073989868, "regret_row": 0.5837278962135315, "regret_any": 0.7606629729270935, "regret_bot": 0.790117084980011, "value_dist": 0.31047120690345764, "value_other_env": 0.06889013946056366, "value_corner": 0.672842800617218, "value_row": 0.2129611074924469, "value_any": 0.06889013946056366, "value_bot": 0.00657196668908, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00106.png", "entropy": 0.7194600105285645} +{"ts": "2026-01-29T21:28:06.750253Z", "loop": 107, "env_steps": 65740800, "exact_value_avg": 0.3105173110961914, "regret_dist": 0.49326005578041077, "regret_other_env": 0.7606740593910217, "regret_corner": 0.09213902801275253, "regret_row": 0.5871252417564392, "regret_any": 0.7606740593910217, "regret_bot": 0.7898843288421631, "value_dist": 0.3105173110961914, "value_other_env": 0.06887901574373245, "value_corner": 0.672974705696106, "value_row": 0.20956376194953918, "value_any": 0.06887901574373245, "value_bot": 0.006804763805121183, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00107.png", "entropy": 0.719354510307312} +{"ts": "2026-01-29T21:28:07.955378Z", "loop": 108, "env_steps": 66355200, "exact_value_avg": 0.31044715642929077, "regret_dist": 0.4933302402496338, "regret_other_env": 0.7606964111328125, "regret_corner": 0.09228098392486572, "regret_row": 0.5902712345123291, "regret_any": 0.7606964111328125, "regret_bot": 0.7896640300750732, "value_dist": 0.31044715642929077, "value_other_env": 0.06885670125484467, "value_corner": 0.6728327870368958, "value_row": 0.20641779899597168, "value_any": 0.06885670125484467, "value_bot": 0.007025026250630617, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00108.png", "entropy": 0.7188180685043335} +{"ts": "2026-01-29T21:28:09.165266Z", "loop": 109, "env_steps": 66969600, "exact_value_avg": 0.3103354573249817, "regret_dist": 0.4934418499469757, "regret_other_env": 0.7607185244560242, "regret_corner": 0.09252683818340302, "regret_row": 0.5925346612930298, "regret_any": 0.7607185244560242, "regret_bot": 0.7895020842552185, "value_dist": 0.3103354573249817, "value_other_env": 0.06883454322814941, "value_corner": 0.6725868582725525, "value_row": 0.20415440201759338, "value_any": 0.06883454322814941, "value_bot": 0.0071869585663080215, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00109.png", "entropy": 0.7181439399719238} +{"ts": "2026-01-29T21:28:10.370826Z", "loop": 110, "env_steps": 67584000, "exact_value_avg": 0.31019559502601624, "regret_dist": 0.4935818314552307, "regret_other_env": 0.7607424855232239, "regret_corner": 0.09284081310033798, "regret_row": 0.5945268869400024, "regret_any": 0.7607424855232239, "regret_bot": 0.7893577814102173, "value_dist": 0.31019559502601624, "value_other_env": 0.06881068646907806, "value_corner": 0.6722729206085205, "value_row": 0.20216216146945953, "value_any": 0.06881068646907806, "value_bot": 0.007331342902034521, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00110.png", "entropy": 0.7173587679862976} +{"ts": "2026-01-29T21:28:11.572986Z", "loop": 111, "env_steps": 68198400, "exact_value_avg": 0.3100677728652954, "regret_dist": 0.49370959401130676, "regret_other_env": 0.7607598900794983, "regret_corner": 0.09313412755727768, "regret_row": 0.5959349274635315, "regret_any": 0.7607598900794983, "regret_bot": 0.7892541885375977, "value_dist": 0.3100677728652954, "value_other_env": 0.0687931701540947, "value_corner": 0.6719796061515808, "value_row": 0.20075412094593048, "value_any": 0.0687931701540947, "value_bot": 0.0074349213391542435, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00111.png", "entropy": 0.7167564034461975} +{"ts": "2026-01-29T21:28:12.774338Z", "loop": 112, "env_steps": 68812800, "exact_value_avg": 0.3099724352359772, "regret_dist": 0.4938048720359802, "regret_other_env": 0.7607790231704712, "regret_corner": 0.09334366768598557, "regret_row": 0.5969322919845581, "regret_any": 0.7607790231704712, "regret_bot": 0.7891806364059448, "value_dist": 0.3099724352359772, "value_other_env": 0.06877407431602478, "value_corner": 0.6717699766159058, "value_row": 0.19975672662258148, "value_any": 0.06877407431602478, "value_bot": 0.00750837754458189, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00112.png", "entropy": 0.7161062955856323} +{"ts": "2026-01-29T21:28:13.978133Z", "loop": 113, "env_steps": 69427200, "exact_value_avg": 0.30983567237854004, "regret_dist": 0.49394169449806213, "regret_other_env": 0.7607983350753784, "regret_corner": 0.09365667402744293, "regret_row": 0.5981318950653076, "regret_any": 0.7607983350753784, "regret_bot": 0.789091169834137, "value_dist": 0.30983567237854004, "value_other_env": 0.06875476986169815, "value_corner": 0.671457052230835, "value_row": 0.19855715334415436, "value_any": 0.06875476986169815, "value_bot": 0.007597915828227997, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00113.png", "entropy": 0.7154543399810791} +{"ts": "2026-01-29T21:28:15.179971Z", "loop": 114, "env_steps": 70041600, "exact_value_avg": 0.30982452630996704, "regret_dist": 0.4939528703689575, "regret_other_env": 0.7608050107955933, "regret_corner": 0.09367457032203674, "regret_row": 0.598258376121521, "regret_any": 0.7608050107955933, "regret_bot": 0.7890831828117371, "value_dist": 0.30982452630996704, "value_other_env": 0.0687481164932251, "value_corner": 0.6714391708374023, "value_row": 0.19843071699142456, "value_any": 0.0687481164932251, "value_bot": 0.007605810184031725, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00114.png", "entropy": 0.7151826620101929} +{"ts": "2026-01-29T21:28:16.383586Z", "loop": 115, "env_steps": 70656000, "exact_value_avg": 0.30987808108329773, "regret_dist": 0.49389928579330444, "regret_other_env": 0.7608106136322021, "regret_corner": 0.09353229403495789, "regret_row": 0.5979389548301697, "regret_any": 0.7608106136322021, "regret_bot": 0.7891101241111755, "value_dist": 0.30987808108329773, "value_other_env": 0.06874247640371323, "value_corner": 0.6715814471244812, "value_row": 0.1987500935792923, "value_any": 0.06874247640371323, "value_bot": 0.007578915450721979, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00115.png", "entropy": 0.7149384021759033} +{"ts": "2026-01-29T21:28:17.585056Z", "loop": 116, "env_steps": 71270400, "exact_value_avg": 0.3098752796649933, "regret_dist": 0.4939020872116089, "regret_other_env": 0.7608252167701721, "regret_corner": 0.09351740032434464, "regret_row": 0.5981443524360657, "regret_any": 0.7608252167701721, "regret_bot": 0.7890987396240234, "value_dist": 0.3098752796649933, "value_other_env": 0.06872793287038803, "value_corner": 0.6715962886810303, "value_row": 0.19854477047920227, "value_any": 0.06872793287038803, "value_bot": 0.007590337190777063, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00116.png", "entropy": 0.7143399119377136} +{"ts": "2026-01-29T21:28:18.787705Z", "loop": 117, "env_steps": 71884800, "exact_value_avg": 0.3100537657737732, "regret_dist": 0.49372363090515137, "regret_other_env": 0.7608208656311035, "regret_corner": 0.09307771176099777, "regret_row": 0.596758246421814, "regret_any": 0.7608208656311035, "regret_bot": 0.7892082333564758, "value_dist": 0.3100537657737732, "value_other_env": 0.06873226910829544, "value_corner": 0.6720359921455383, "value_row": 0.19993075728416443, "value_any": 0.06873226910829544, "value_bot": 0.0074808127246797085, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00117.png", "entropy": 0.7143815755844116} +{"ts": "2026-01-29T21:28:19.991657Z", "loop": 118, "env_steps": 72499200, "exact_value_avg": 0.3101998567581177, "regret_dist": 0.4935775101184845, "regret_other_env": 0.7608195543289185, "regret_corner": 0.09271442145109177, "regret_row": 0.5954774022102356, "regret_any": 0.7608195543289185, "regret_bot": 0.7893088459968567, "value_dist": 0.3101998567581177, "value_other_env": 0.06873353570699692, "value_corner": 0.6723992824554443, "value_row": 0.20121167600154877, "value_any": 0.06873353570699692, "value_bot": 0.007380193565040827, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00118.png", "entropy": 0.7143188118934631} +{"ts": "2026-01-29T21:28:21.194618Z", "loop": 119, "env_steps": 73113600, "exact_value_avg": 0.31040114164352417, "regret_dist": 0.4933762550354004, "regret_other_env": 0.7608116865158081, "regret_corner": 0.09222305566072464, "regret_row": 0.5932556986808777, "regret_any": 0.7608116865158081, "regret_bot": 0.789476752281189, "value_dist": 0.31040114164352417, "value_other_env": 0.06874144077301025, "value_corner": 0.6728906631469727, "value_row": 0.20343340933322906, "value_any": 0.06874144077301025, "value_bot": 0.00721219414845109, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00119.png", "entropy": 0.7144536972045898} +{"ts": "2026-01-29T21:28:22.397478Z", "loop": 120, "env_steps": 73728000, "exact_value_avg": 0.3105844259262085, "regret_dist": 0.4931929409503937, "regret_other_env": 0.7608023285865784, "regret_corner": 0.09177880734205246, "regret_row": 0.5902443528175354, "regret_any": 0.7608023285865784, "regret_bot": 0.7896975874900818, "value_dist": 0.3105844259262085, "value_other_env": 0.0687507688999176, "value_corner": 0.6733348965644836, "value_row": 0.20644471049308777, "value_any": 0.0687507688999176, "value_bot": 0.006991417147219181, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00120.png", "entropy": 0.7145749926567078} +{"ts": "2026-01-29T21:28:23.599736Z", "loop": 121, "env_steps": 74342400, "exact_value_avg": 0.3106706440448761, "regret_dist": 0.49310678243637085, "regret_other_env": 0.7607986330986023, "regret_corner": 0.09156893938779831, "regret_row": 0.586591362953186, "regret_any": 0.7607986330986023, "regret_bot": 0.7899571657180786, "value_dist": 0.3106706440448761, "value_other_env": 0.06875444948673248, "value_corner": 0.6735448837280273, "value_row": 0.21009768545627594, "value_any": 0.06875444948673248, "value_bot": 0.006731810513883829, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00121.png", "entropy": 0.7144074440002441} +{"ts": "2026-01-29T21:28:24.803540Z", "loop": 122, "env_steps": 74956800, "exact_value_avg": 0.3105986416339874, "regret_dist": 0.4931788146495819, "regret_other_env": 0.7608062028884888, "regret_corner": 0.09173763543367386, "regret_row": 0.5826380848884583, "regret_any": 0.7608062028884888, "regret_bot": 0.7902302145957947, "value_dist": 0.3105986416339874, "value_other_env": 0.06874693185091019, "value_corner": 0.6733761429786682, "value_row": 0.21405096352100372, "value_any": 0.06874693185091019, "value_bot": 0.006458835676312447, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00122.png", "entropy": 0.7137044668197632} +{"ts": "2026-01-29T21:28:26.004993Z", "loop": 123, "env_steps": 75571200, "exact_value_avg": 0.31038954854011536, "regret_dist": 0.4933878183364868, "regret_other_env": 0.7608258128166199, "regret_corner": 0.09223081916570663, "regret_row": 0.5791019201278687, "regret_any": 0.7608258128166199, "regret_bot": 0.7904680371284485, "value_dist": 0.31038954854011536, "value_other_env": 0.06872732192277908, "value_corner": 0.6728828549385071, "value_row": 0.2175871878862381, "value_any": 0.06872732192277908, "value_bot": 0.006221013143658638, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00123.png", "entropy": 0.7125924825668335} +{"ts": "2026-01-29T21:28:27.205986Z", "loop": 124, "env_steps": 76185600, "exact_value_avg": 0.31009647250175476, "regret_dist": 0.4936809241771698, "regret_other_env": 0.7608516812324524, "regret_corner": 0.09292472898960114, "regret_row": 0.5760591626167297, "regret_any": 0.7608516812324524, "regret_bot": 0.7906685471534729, "value_dist": 0.31009647250175476, "value_other_env": 0.06870143860578537, "value_corner": 0.6721889972686768, "value_row": 0.22062987089157104, "value_any": 0.06870143860578537, "value_bot": 0.006020531058311462, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00124.png", "entropy": 0.7112347483634949} +{"ts": "2026-01-29T21:28:28.409388Z", "loop": 125, "env_steps": 76800000, "exact_value_avg": 0.3097594082355499, "regret_dist": 0.49401795864105225, "regret_other_env": 0.7608820796012878, "regret_corner": 0.09372174739837646, "regret_row": 0.5734479427337646, "regret_any": 0.7608820796012878, "regret_bot": 0.790838897228241, "value_dist": 0.3097594082355499, "value_other_env": 0.06867101788520813, "value_corner": 0.6713919639587402, "value_row": 0.22324112057685852, "value_any": 0.06867101788520813, "value_bot": 0.00585017679259181, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00125.png", "entropy": 0.7097967267036438} +{"ts": "2026-01-29T21:28:29.613798Z", "loop": 126, "env_steps": 77414400, "exact_value_avg": 0.3096819818019867, "regret_dist": 0.49409544467926025, "regret_other_env": 0.7608897686004639, "regret_corner": 0.09390389919281006, "regret_row": 0.5729236602783203, "regret_any": 0.7608897686004639, "regret_bot": 0.7908733487129211, "value_dist": 0.3096819818019867, "value_other_env": 0.0686633363366127, "value_corner": 0.6712098717689514, "value_row": 0.22376541793346405, "value_any": 0.0686633363366127, "value_bot": 0.005815652199089527, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00126.png", "entropy": 0.7094390988349915} +{"ts": "2026-01-29T21:28:30.817957Z", "loop": 127, "env_steps": 78028800, "exact_value_avg": 0.3097061216831207, "regret_dist": 0.49407124519348145, "regret_other_env": 0.7608914971351624, "regret_corner": 0.0938408300280571, "regret_row": 0.5730365514755249, "regret_any": 0.7608914971351624, "regret_bot": 0.7908679842948914, "value_dist": 0.3097061216831207, "value_other_env": 0.06866160035133362, "value_corner": 0.671272873878479, "value_row": 0.22365249693393707, "value_any": 0.06866160035133362, "value_bot": 0.005821052473038435, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00127.png", "entropy": 0.7093825340270996} +{"ts": "2026-01-29T21:28:32.021857Z", "loop": 128, "env_steps": 78643200, "exact_value_avg": 0.3098212778568268, "regret_dist": 0.4939561188220978, "regret_other_env": 0.7608864903450012, "regret_corner": 0.09356049448251724, "regret_row": 0.5738142728805542, "regret_any": 0.7608864903450012, "regret_bot": 0.7908191680908203, "value_dist": 0.3098212778568268, "value_other_env": 0.06866662204265594, "value_corner": 0.6715531945228577, "value_row": 0.222874715924263, "value_any": 0.06866662204265594, "value_bot": 0.005869871936738491, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00128.png", "entropy": 0.7096756100654602} +{"ts": "2026-01-29T21:28:33.226569Z", "loop": 129, "env_steps": 79257600, "exact_value_avg": 0.31009742617607117, "regret_dist": 0.4936799705028534, "regret_other_env": 0.7608689665794373, "regret_corner": 0.09289643168449402, "regret_row": 0.5759437680244446, "regret_any": 0.7608689665794373, "regret_bot": 0.7906832098960876, "value_dist": 0.31009742617607117, "value_other_env": 0.06868412345647812, "value_corner": 0.6722173690795898, "value_row": 0.22074531018733978, "value_any": 0.06868412345647812, "value_bot": 0.0060058156959712505, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00129.png", "entropy": 0.710604727268219} +{"ts": "2026-01-29T21:28:34.430251Z", "loop": 130, "env_steps": 79872000, "exact_value_avg": 0.31034979224205017, "regret_dist": 0.4934276342391968, "regret_other_env": 0.760855495929718, "regret_corner": 0.09228579699993134, "regret_row": 0.578356146812439, "regret_any": 0.760855495929718, "regret_bot": 0.7905275821685791, "value_dist": 0.31034979224205017, "value_other_env": 0.06869767606258392, "value_corner": 0.672827959060669, "value_row": 0.21833287179470062, "value_any": 0.06869767606258392, "value_bot": 0.006161479279398918, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00130.png", "entropy": 0.7114000916481018} +{"ts": "2026-01-29T21:28:35.633690Z", "loop": 131, "env_steps": 80486400, "exact_value_avg": 0.310580313205719, "regret_dist": 0.49319708347320557, "regret_other_env": 0.7608428597450256, "regret_corner": 0.09172835946083069, "regret_row": 0.5814692378044128, "regret_any": 0.7608428597450256, "regret_bot": 0.7903220057487488, "value_dist": 0.310580313205719, "value_other_env": 0.06871023774147034, "value_corner": 0.6733853816986084, "value_row": 0.21521979570388794, "value_any": 0.06871023774147034, "value_bot": 0.006367032416164875, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00131.png", "entropy": 0.7122323513031006} +{"ts": "2026-01-29T21:28:36.836239Z", "loop": 132, "env_steps": 81100800, "exact_value_avg": 0.31067800521850586, "regret_dist": 0.4930993914604187, "regret_other_env": 0.7608432769775391, "regret_corner": 0.09148348867893219, "regret_row": 0.5836936235427856, "regret_any": 0.7608432769775391, "regret_bot": 0.7901732921600342, "value_dist": 0.31067800521850586, "value_other_env": 0.0687098428606987, "value_corner": 0.6736302375793457, "value_row": 0.21299543976783752, "value_any": 0.0687098428606987, "value_bot": 0.006515700835734606, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00132.png", "entropy": 0.712444007396698} +{"ts": "2026-01-29T21:28:38.041539Z", "loop": 133, "env_steps": 81715200, "exact_value_avg": 0.310727059841156, "regret_dist": 0.49305030703544617, "regret_other_env": 0.760848343372345, "regret_corner": 0.09135321527719498, "regret_row": 0.5863590836524963, "regret_any": 0.760848343372345, "regret_bot": 0.7899921536445618, "value_dist": 0.310727059841156, "value_other_env": 0.06870472431182861, "value_corner": 0.6737605333328247, "value_row": 0.21032992005348206, "value_any": 0.06870472431182861, "value_bot": 0.006696891505271196, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00133.png", "entropy": 0.7124826312065125} +{"ts": "2026-01-29T21:28:39.245440Z", "loop": 134, "env_steps": 82329600, "exact_value_avg": 0.31069105863571167, "regret_dist": 0.4930863380432129, "regret_other_env": 0.7608615159988403, "regret_corner": 0.09142353385686874, "regret_row": 0.5893059372901917, "regret_any": 0.7608615159988403, "regret_bot": 0.789787769317627, "value_dist": 0.31069105863571167, "value_other_env": 0.06869159638881683, "value_corner": 0.6736901998519897, "value_row": 0.20738312602043152, "value_any": 0.06869159638881683, "value_bot": 0.006901251617819071, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00134.png", "entropy": 0.7121951580047607} +{"ts": "2026-01-29T21:28:40.451076Z", "loop": 135, "env_steps": 82944000, "exact_value_avg": 0.31061360239982605, "regret_dist": 0.4931637942790985, "regret_other_env": 0.7608741521835327, "regret_corner": 0.09159819036722183, "regret_row": 0.5914035439491272, "regret_any": 0.7608741521835327, "regret_bot": 0.7896388173103333, "value_dist": 0.31061360239982605, "value_other_env": 0.06867888569831848, "value_corner": 0.6735156178474426, "value_row": 0.2052854597568512, "value_any": 0.06867888569831848, "value_bot": 0.0070502725429832935, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00135.png", "entropy": 0.7118134498596191} +{"ts": "2026-01-29T21:28:41.655174Z", "loop": 136, "env_steps": 83558400, "exact_value_avg": 0.31047123670578003, "regret_dist": 0.49330615997314453, "regret_other_env": 0.760891318321228, "regret_corner": 0.09192835539579391, "regret_row": 0.5936287045478821, "regret_any": 0.760891318321228, "regret_bot": 0.789478063583374, "value_dist": 0.31047123670578003, "value_other_env": 0.06866175681352615, "value_corner": 0.673185408115387, "value_row": 0.20306037366390228, "value_any": 0.06866175681352615, "value_bot": 0.007210999261587858, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00136.png", "entropy": 0.7113050818443298} +{"ts": "2026-01-29T21:28:42.861642Z", "loop": 137, "env_steps": 84172800, "exact_value_avg": 0.31037232279777527, "regret_dist": 0.4934050440788269, "regret_other_env": 0.7609033584594727, "regret_corner": 0.09215748310089111, "regret_row": 0.5949164628982544, "regret_any": 0.7609033584594727, "regret_bot": 0.7893835306167603, "value_dist": 0.31037232279777527, "value_other_env": 0.06864971667528152, "value_corner": 0.6729562282562256, "value_row": 0.2017725557088852, "value_any": 0.06864971667528152, "value_bot": 0.007305471692234278, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00137.png", "entropy": 0.710905134677887} +{"ts": "2026-01-29T21:28:44.067094Z", "loop": 138, "env_steps": 84787200, "exact_value_avg": 0.31028270721435547, "regret_dist": 0.4934946596622467, "regret_other_env": 0.7609147429466248, "regret_corner": 0.09236447513103485, "regret_row": 0.595908522605896, "regret_any": 0.7609147429466248, "regret_bot": 0.7893101572990417, "value_dist": 0.31028270721435547, "value_other_env": 0.06863836199045181, "value_corner": 0.6727492213249207, "value_row": 0.20078057050704956, "value_any": 0.06863836199045181, "value_bot": 0.007378843147307634, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00138.png", "entropy": 0.7105282545089722} +{"ts": "2026-01-29T21:28:45.271796Z", "loop": 139, "env_steps": 85401600, "exact_value_avg": 0.310221791267395, "regret_dist": 0.49355560541152954, "regret_other_env": 0.7609241604804993, "regret_corner": 0.09250275790691376, "regret_row": 0.5965561270713806, "regret_any": 0.7609241604804993, "regret_bot": 0.7892633080482483, "value_dist": 0.310221791267395, "value_other_env": 0.06862897425889969, "value_corner": 0.6726109981536865, "value_row": 0.20013290643692017, "value_any": 0.06862897425889969, "value_bot": 0.007425770163536072, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00139.png", "entropy": 0.7102125287055969} +{"ts": "2026-01-29T21:28:46.477226Z", "loop": 140, "env_steps": 86016000, "exact_value_avg": 0.3103148937225342, "regret_dist": 0.4934625029563904, "regret_other_env": 0.7609164118766785, "regret_corner": 0.09228159487247467, "regret_row": 0.5956242680549622, "regret_any": 0.7609164118766785, "regret_bot": 0.789333701133728, "value_dist": 0.3103148937225342, "value_other_env": 0.0686367079615593, "value_corner": 0.6728321313858032, "value_row": 0.20106473565101624, "value_any": 0.0686367079615593, "value_bot": 0.007355351001024246, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00140.png", "entropy": 0.7104616761207581} +{"ts": "2026-01-29T21:28:47.681515Z", "loop": 141, "env_steps": 86630400, "exact_value_avg": 0.3104938566684723, "regret_dist": 0.49328354001045227, "regret_other_env": 0.7609005570411682, "regret_corner": 0.09185800701379776, "regret_row": 0.5935149788856506, "regret_any": 0.7609005570411682, "regret_bot": 0.7894896268844604, "value_dist": 0.3104938566684723, "value_other_env": 0.06865257769823074, "value_corner": 0.6732557415962219, "value_row": 0.20317400991916656, "value_any": 0.06865257769823074, "value_bot": 0.007199437357485294, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00141.png", "entropy": 0.7109812498092651} +{"ts": "2026-01-29T21:28:48.887352Z", "loop": 142, "env_steps": 87244800, "exact_value_avg": 0.3106542229652405, "regret_dist": 0.49312323331832886, "regret_other_env": 0.7608842849731445, "regret_corner": 0.09148159623146057, "regret_row": 0.5909075140953064, "regret_any": 0.7608842849731445, "regret_bot": 0.7896788120269775, "value_dist": 0.3106542229652405, "value_other_env": 0.0686689093708992, "value_corner": 0.6736321449279785, "value_row": 0.20578151941299438, "value_any": 0.0686689093708992, "value_bot": 0.007010250352323055, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00142.png", "entropy": 0.7113951444625854} +{"ts": "2026-01-29T21:28:50.092481Z", "loop": 143, "env_steps": 87859200, "exact_value_avg": 0.3107425570487976, "regret_dist": 0.49303480982780457, "regret_other_env": 0.7608726024627686, "regret_corner": 0.0912780836224556, "regret_row": 0.5878311395645142, "regret_any": 0.7608726024627686, "regret_bot": 0.7898962497711182, "value_dist": 0.3107425570487976, "value_other_env": 0.06868049502372742, "value_corner": 0.6738356351852417, "value_row": 0.208857923746109, "value_any": 0.06868049502372742, "value_bot": 0.006792852189391851, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00143.png", "entropy": 0.711610734462738} +{"ts": "2026-01-29T21:28:51.299271Z", "loop": 144, "env_steps": 88473600, "exact_value_avg": 0.310729444026947, "regret_dist": 0.49304795265197754, "regret_other_env": 0.7608708143234253, "regret_corner": 0.0913136675953865, "regret_row": 0.5843400359153748, "regret_any": 0.7608708143234253, "regret_bot": 0.7901370525360107, "value_dist": 0.310729444026947, "value_other_env": 0.06868235766887665, "value_corner": 0.6738000512123108, "value_row": 0.2123490273952484, "value_any": 0.06868235766887665, "value_bot": 0.006551947444677353, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00144.png", "entropy": 0.7113768458366394} +{"ts": "2026-01-29T21:28:52.505304Z", "loop": 145, "env_steps": 89088000, "exact_value_avg": 0.31065574288368225, "regret_dist": 0.4931216239929199, "regret_other_env": 0.7608746886253357, "regret_corner": 0.09149197489023209, "regret_row": 0.5822780132293701, "regret_any": 0.7608746886253357, "regret_bot": 0.7902770638465881, "value_dist": 0.31065574288368225, "value_other_env": 0.0686783418059349, "value_corner": 0.6736217737197876, "value_row": 0.21441106498241425, "value_any": 0.0686783418059349, "value_bot": 0.006411920767277479, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00145.png", "entropy": 0.7110351920127869} +{"ts": "2026-01-29T21:28:53.710311Z", "loop": 146, "env_steps": 89702400, "exact_value_avg": 0.31059399247169495, "regret_dist": 0.493183434009552, "regret_other_env": 0.7608811259269714, "regret_corner": 0.09163682162761688, "regret_row": 0.5810220241546631, "regret_any": 0.7608811259269714, "regret_bot": 0.7903622388839722, "value_dist": 0.31059399247169495, "value_other_env": 0.06867200136184692, "value_corner": 0.6734769344329834, "value_row": 0.2156670242547989, "value_any": 0.06867200136184692, "value_bot": 0.0063268025405704975, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00146.png", "entropy": 0.7106412053108215} +{"ts": "2026-01-29T21:28:54.925084Z", "loop": 147, "env_steps": 90316800, "exact_value_avg": 0.3105417788028717, "regret_dist": 0.49323561787605286, "regret_other_env": 0.7608859539031982, "regret_corner": 0.0917600691318512, "regret_row": 0.5802434086799622, "regret_any": 0.7608859539031982, "regret_bot": 0.7904143929481506, "value_dist": 0.3105417788028717, "value_other_env": 0.06866716593503952, "value_corner": 0.6733536720275879, "value_row": 0.21644560992717743, "value_any": 0.06866716593503952, "value_bot": 0.006274650804698467, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00147.png", "entropy": 0.7103914022445679} +{"ts": "2026-01-29T21:28:56.128278Z", "loop": 148, "env_steps": 90931200, "exact_value_avg": 0.31055548787117004, "regret_dist": 0.4932219386100769, "regret_other_env": 0.7608876824378967, "regret_corner": 0.09172326326370239, "regret_row": 0.5803890824317932, "regret_any": 0.7608876824378967, "regret_bot": 0.7904051542282104, "value_dist": 0.31055548787117004, "value_other_env": 0.06866543740034103, "value_corner": 0.6733905076980591, "value_row": 0.21629993617534637, "value_any": 0.06866543740034103, "value_bot": 0.006283909548074007, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00148.png", "entropy": 0.7103440761566162} +{"ts": "2026-01-29T21:28:57.332346Z", "loop": 149, "env_steps": 91545600, "exact_value_avg": 0.3106324374675751, "regret_dist": 0.4931449890136719, "regret_other_env": 0.7608864903450012, "regret_corner": 0.09153266251087189, "regret_row": 0.5815862417221069, "regret_any": 0.7608864903450012, "regret_bot": 0.7903257012367249, "value_dist": 0.3106324374675751, "value_other_env": 0.06866663694381714, "value_corner": 0.6735811233520508, "value_row": 0.21510279178619385, "value_any": 0.06866663694381714, "value_bot": 0.006363394670188427, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00149.png", "entropy": 0.7105134129524231} +{"ts": "2026-01-29T21:28:58.540275Z", "loop": 150, "env_steps": 92160000, "exact_value_avg": 0.31065481901168823, "regret_dist": 0.49312257766723633, "regret_other_env": 0.760891318321228, "regret_corner": 0.09146946668624878, "regret_row": 0.5818850994110107, "regret_any": 0.760891318321228, "regret_bot": 0.7903074026107788, "value_dist": 0.31065481901168823, "value_other_env": 0.06866180151700974, "value_corner": 0.6736443042755127, "value_row": 0.21480397880077362, "value_any": 0.06866180151700974, "value_bot": 0.0063815852627158165, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00150.png", "entropy": 0.7103561162948608} +{"ts": "2026-01-29T21:28:59.745408Z", "loop": 151, "env_steps": 92774400, "exact_value_avg": 0.3106604814529419, "regret_dist": 0.49311694502830505, "regret_other_env": 0.7608959674835205, "regret_corner": 0.0914483442902565, "regret_row": 0.5818158388137817, "regret_any": 0.7608959674835205, "regret_bot": 0.790313720703125, "value_dist": 0.3106604814529419, "value_other_env": 0.06865717470645905, "value_corner": 0.6736654043197632, "value_row": 0.21487319469451904, "value_any": 0.06865717470645905, "value_bot": 0.006375416647642851, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00151.png", "entropy": 0.7101573348045349} +{"ts": "2026-01-29T21:29:00.948754Z", "loop": 152, "env_steps": 93388800, "exact_value_avg": 0.31067442893981934, "regret_dist": 0.4931029677391052, "regret_other_env": 0.7608978748321533, "regret_corner": 0.09141059219837189, "regret_row": 0.5821499824523926, "regret_any": 0.7608978748321533, "regret_bot": 0.7902916669845581, "value_dist": 0.31067442893981934, "value_other_env": 0.06865531206130981, "value_corner": 0.6737030744552612, "value_row": 0.2145390808582306, "value_any": 0.06865531206130981, "value_bot": 0.0063973418436944485, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00152.png", "entropy": 0.7101336717605591} +{"ts": "2026-01-29T21:29:02.155495Z", "loop": 153, "env_steps": 94003200, "exact_value_avg": 0.3106946349143982, "regret_dist": 0.49308285117149353, "regret_other_env": 0.7608985900878906, "regret_corner": 0.09135914593935013, "regret_row": 0.5825114250183105, "regret_any": 0.7608985900878906, "regret_bot": 0.7902683019638062, "value_dist": 0.3106946349143982, "value_other_env": 0.06865456700325012, "value_corner": 0.6737546920776367, "value_row": 0.21417762339115143, "value_any": 0.06865456700325012, "value_bot": 0.006420742254704237, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00153.png", "entropy": 0.7100942730903625} +{"ts": "2026-01-29T21:29:03.364116Z", "loop": 154, "env_steps": 94617600, "exact_value_avg": 0.31073713302612305, "regret_dist": 0.49304020404815674, "regret_other_env": 0.7609001994132996, "regret_corner": 0.09125020354986191, "regret_row": 0.5835577845573425, "regret_any": 0.7609001994132996, "regret_bot": 0.7901976108551025, "value_dist": 0.31073713302612305, "value_other_env": 0.06865289062261581, "value_corner": 0.6738635301589966, "value_row": 0.21313124895095825, "value_any": 0.06865289062261581, "value_bot": 0.006491422653198242, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00154.png", "entropy": 0.7101793885231018} +{"ts": "2026-01-29T21:29:04.564651Z", "loop": 155, "env_steps": 95232000, "exact_value_avg": 0.3107633590698242, "regret_dist": 0.49301397800445557, "regret_other_env": 0.7609009146690369, "regret_corner": 0.09118357300758362, "regret_row": 0.5844248533248901, "regret_any": 0.7609009146690369, "regret_bot": 0.7901400923728943, "value_dist": 0.3107633590698242, "value_other_env": 0.06865210831165314, "value_corner": 0.6739301681518555, "value_row": 0.21226418018341064, "value_any": 0.06865210831165314, "value_bot": 0.006548919714987278, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00155.png", "entropy": 0.7102162837982178} +{"ts": "2026-01-29T21:29:05.765453Z", "loop": 156, "env_steps": 95846400, "exact_value_avg": 0.3107874393463135, "regret_dist": 0.4929899275302887, "regret_other_env": 0.760904848575592, "regret_corner": 0.09111746400594711, "regret_row": 0.5853701829910278, "regret_any": 0.760904848575592, "regret_bot": 0.7900760173797607, "value_dist": 0.3107874393463135, "value_other_env": 0.06864822655916214, "value_corner": 0.6739962697029114, "value_row": 0.21131889522075653, "value_any": 0.06864822655916214, "value_bot": 0.006612974219024181, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00156.png", "entropy": 0.710137665271759} +{"ts": "2026-01-29T21:29:06.965827Z", "loop": 157, "env_steps": 96460800, "exact_value_avg": 0.31079864501953125, "regret_dist": 0.4929787516593933, "regret_other_env": 0.7609108686447144, "regret_corner": 0.09108049422502518, "regret_row": 0.5871005654335022, "regret_any": 0.7609108686447144, "regret_bot": 0.7899582982063293, "value_dist": 0.31079864501953125, "value_other_env": 0.06864222139120102, "value_corner": 0.6740332245826721, "value_row": 0.20958852767944336, "value_any": 0.06864222139120102, "value_bot": 0.006730755791068077, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00157.png", "entropy": 0.7100344300270081} +{"ts": "2026-01-29T21:29:08.167799Z", "loop": 158, "env_steps": 97075200, "exact_value_avg": 0.3107856214046478, "regret_dist": 0.49299174547195435, "regret_other_env": 0.7609198093414307, "regret_corner": 0.09109961241483688, "regret_row": 0.5884027481079102, "regret_any": 0.7609198093414307, "regret_bot": 0.7898692488670349, "value_dist": 0.3107856214046478, "value_other_env": 0.06863325834274292, "value_corner": 0.674014151096344, "value_row": 0.20828630030155182, "value_any": 0.06863325834274292, "value_bot": 0.006819873582571745, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00158.png", "entropy": 0.7097845077514648} +{"ts": "2026-01-29T21:29:09.367244Z", "loop": 159, "env_steps": 97689600, "exact_value_avg": 0.3107554316520691, "regret_dist": 0.4930219352245331, "regret_other_env": 0.7609317898750305, "regret_corner": 0.09115713834762573, "regret_row": 0.5899625420570374, "regret_any": 0.7609317898750305, "regret_bot": 0.7897610664367676, "value_dist": 0.3107554316520691, "value_other_env": 0.06862132251262665, "value_corner": 0.673956573009491, "value_row": 0.206726536154747, "value_any": 0.06862132251262665, "value_bot": 0.006928000133484602, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00159.png", "entropy": 0.7094632387161255} +{"ts": "2026-01-29T21:29:10.567151Z", "loop": 160, "env_steps": 98304000, "exact_value_avg": 0.3106521964073181, "regret_dist": 0.49312517046928406, "regret_other_env": 0.7609466910362244, "regret_corner": 0.09139285236597061, "regret_row": 0.5922412872314453, "regret_any": 0.7609466910362244, "regret_bot": 0.7895986437797546, "value_dist": 0.3106521964073181, "value_other_env": 0.06860639154911041, "value_corner": 0.6737208962440491, "value_row": 0.20444771647453308, "value_any": 0.06860639154911041, "value_bot": 0.007090345956385136, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00160.png", "entropy": 0.7089881896972656} +{"ts": "2026-01-29T21:29:11.769627Z", "loop": 161, "env_steps": 98918400, "exact_value_avg": 0.31050223112106323, "regret_dist": 0.49327516555786133, "regret_other_env": 0.7609688639640808, "regret_corner": 0.09173456579446793, "regret_row": 0.5944663286209106, "regret_any": 0.7609688639640808, "regret_bot": 0.7894386649131775, "value_dist": 0.31050223112106323, "value_other_env": 0.06858421862125397, "value_corner": 0.6733791828155518, "value_row": 0.20222271978855133, "value_any": 0.06858421862125397, "value_bot": 0.00725045520812273, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00161.png", "entropy": 0.7082409262657166} +{"ts": "2026-01-29T21:29:12.972220Z", "loop": 162, "env_steps": 99532800, "exact_value_avg": 0.310285359621048, "regret_dist": 0.4934920370578766, "regret_other_env": 0.7609961628913879, "regret_corner": 0.09223583340644836, "regret_row": 0.5967813730239868, "regret_any": 0.7609961628913879, "regret_bot": 0.7892686128616333, "value_dist": 0.310285359621048, "value_other_env": 0.06855695694684982, "value_corner": 0.6728779077529907, "value_row": 0.19990770518779755, "value_any": 0.06855695694684982, "value_bot": 0.007420457433909178, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00162.png", "entropy": 0.7073400616645813} +{"ts": "2026-01-29T21:29:14.175026Z", "loop": 163, "env_steps": 100147200, "exact_value_avg": 0.31011009216308594, "regret_dist": 0.49366724491119385, "regret_other_env": 0.7610192894935608, "regret_corner": 0.09263910353183746, "regret_row": 0.5983436703681946, "regret_any": 0.7610192894935608, "regret_bot": 0.7891520857810974, "value_dist": 0.31011009216308594, "value_other_env": 0.0685337483882904, "value_corner": 0.6724745631217957, "value_row": 0.1983453631401062, "value_any": 0.0685337483882904, "value_bot": 0.007536927703768015, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00163.png", "entropy": 0.7065001130104065} +{"ts": "2026-01-29T21:29:15.380421Z", "loop": 164, "env_steps": 100761600, "exact_value_avg": 0.31005337834358215, "regret_dist": 0.49372398853302, "regret_other_env": 0.7610323429107666, "regret_corner": 0.09276141226291656, "regret_row": 0.5989218950271606, "regret_any": 0.7610323429107666, "regret_bot": 0.7891108393669128, "value_dist": 0.31005337834358215, "value_other_env": 0.06852075457572937, "value_corner": 0.6723523139953613, "value_row": 0.19776716828346252, "value_any": 0.06852075457572937, "value_bot": 0.007578257005661726, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00164.png", "entropy": 0.7059895992279053} +{"ts": "2026-01-29T21:29:16.584647Z", "loop": 165, "env_steps": 101376000, "exact_value_avg": 0.3100970387458801, "regret_dist": 0.49368029832839966, "regret_other_env": 0.7610381841659546, "regret_corner": 0.09264342486858368, "regret_row": 0.5986228585243225, "regret_any": 0.7610381841659546, "regret_bot": 0.7891366481781006, "value_dist": 0.3100970387458801, "value_other_env": 0.06851491332054138, "value_corner": 0.6724702715873718, "value_row": 0.19806621968746185, "value_any": 0.06851491332054138, "value_bot": 0.007552360650151968, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00165.png", "entropy": 0.7057738304138184} +{"ts": "2026-01-29T21:29:17.789763Z", "loop": 166, "env_steps": 101990400, "exact_value_avg": 0.31041666865348816, "regret_dist": 0.4933607578277588, "regret_other_env": 0.7610143423080444, "regret_corner": 0.09188033640384674, "regret_row": 0.595843493938446, "regret_any": 0.7610143423080444, "regret_bot": 0.7893472909927368, "value_dist": 0.31041666865348816, "value_other_env": 0.06853879243135452, "value_corner": 0.6732334494590759, "value_row": 0.20084550976753235, "value_any": 0.06853879243135452, "value_bot": 0.007341776974499226, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00166.png", "entropy": 0.7065109610557556} +{"ts": "2026-01-29T21:29:18.999076Z", "loop": 167, "env_steps": 102604800, "exact_value_avg": 0.31064170598983765, "regret_dist": 0.49313563108444214, "regret_other_env": 0.7609967589378357, "regret_corner": 0.09134393185377121, "regret_row": 0.5931615233421326, "regret_any": 0.7609967589378357, "regret_bot": 0.7895457744598389, "value_dist": 0.31064170598983765, "value_other_env": 0.06855633109807968, "value_corner": 0.6737697720527649, "value_row": 0.20352748036384583, "value_any": 0.06855633109807968, "value_bot": 0.0071432990953326225, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00167.png", "entropy": 0.7070050835609436} +{"ts": "2026-01-29T21:29:20.204367Z", "loop": 168, "env_steps": 103219200, "exact_value_avg": 0.31084302067756653, "regret_dist": 0.4929344058036804, "regret_other_env": 0.7609817385673523, "regret_corner": 0.09086333960294724, "regret_row": 0.5890636444091797, "regret_any": 0.7609817385673523, "regret_bot": 0.7898394465446472, "value_dist": 0.31084302067756653, "value_other_env": 0.06857141107320786, "value_corner": 0.6742504239082336, "value_row": 0.20762543380260468, "value_any": 0.06857141107320786, "value_bot": 0.006849517114460468, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00168.png", "entropy": 0.7072973251342773} +{"ts": "2026-01-29T21:29:21.408677Z", "loop": 169, "env_steps": 103833600, "exact_value_avg": 0.31086671352386475, "regret_dist": 0.4929106831550598, "regret_other_env": 0.7609812617301941, "regret_corner": 0.09080478549003601, "regret_row": 0.5851110816001892, "regret_any": 0.7609812617301941, "regret_bot": 0.7901141047477722, "value_dist": 0.31086671352386475, "value_other_env": 0.06857185810804367, "value_corner": 0.6743089556694031, "value_row": 0.21157792210578918, "value_any": 0.06857185810804367, "value_bot": 0.00657501770183444, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00169.png", "entropy": 0.7069923877716064} +{"ts": "2026-01-29T21:29:22.614308Z", "loop": 170, "env_steps": 104448000, "exact_value_avg": 0.31070879101753235, "regret_dist": 0.4930686056613922, "regret_other_env": 0.7609911561012268, "regret_corner": 0.09118475019931793, "regret_row": 0.5810161828994751, "regret_any": 0.7609911561012268, "regret_bot": 0.7903895378112793, "value_dist": 0.31070879101753235, "value_other_env": 0.06856198608875275, "value_corner": 0.67392897605896, "value_row": 0.2156728059053421, "value_any": 0.06856198608875275, "value_bot": 0.0062995245680212975, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00170.png", "entropy": 0.706217885017395} +{"ts": "2026-01-29T21:29:23.820352Z", "loop": 171, "env_steps": 105062400, "exact_value_avg": 0.3105025291442871, "regret_dist": 0.49327486753463745, "regret_other_env": 0.7610052824020386, "regret_corner": 0.09167919307947159, "regret_row": 0.5782408714294434, "regret_any": 0.7610052824020386, "regret_bot": 0.7905723452568054, "value_dist": 0.3105025291442871, "value_other_env": 0.06854787468910217, "value_corner": 0.6734344959259033, "value_row": 0.21844814717769623, "value_any": 0.06854787468910217, "value_bot": 0.006116725038737059, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00171.png", "entropy": 0.7053738236427307} +{"ts": "2026-01-29T21:29:25.024004Z", "loop": 172, "env_steps": 105676800, "exact_value_avg": 0.31029996275901794, "regret_dist": 0.4934774339199066, "regret_other_env": 0.7610203623771667, "regret_corner": 0.09216301143169403, "regret_row": 0.5762884616851807, "regret_any": 0.7610203623771667, "regret_bot": 0.7906991243362427, "value_dist": 0.31029996275901794, "value_other_env": 0.0685327798128128, "value_corner": 0.6729507446289062, "value_row": 0.22040057182312012, "value_any": 0.0685327798128128, "value_bot": 0.005989880301058292, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00172.png", "entropy": 0.7045855522155762} +{"ts": "2026-01-29T21:29:26.228058Z", "loop": 173, "env_steps": 106291200, "exact_value_avg": 0.3101738691329956, "regret_dist": 0.49360349774360657, "regret_other_env": 0.7610307335853577, "regret_corner": 0.09246262162923813, "regret_row": 0.5752664804458618, "regret_any": 0.7610307335853577, "regret_bot": 0.7907653450965881, "value_dist": 0.3101738691329956, "value_other_env": 0.0685223788022995, "value_corner": 0.6726510524749756, "value_row": 0.22142252326011658, "value_any": 0.0685223788022995, "value_bot": 0.005923704244196415, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00173.png", "entropy": 0.7040427923202515} +{"ts": "2026-01-29T21:29:27.432898Z", "loop": 174, "env_steps": 106905600, "exact_value_avg": 0.3100740611553192, "regret_dist": 0.49370333552360535, "regret_other_env": 0.761042594909668, "regret_corner": 0.09269437938928604, "regret_row": 0.5744368433952332, "regret_any": 0.761042594909668, "regret_bot": 0.7908191084861755, "value_dist": 0.3100740611553192, "value_other_env": 0.068510502576828, "value_corner": 0.6724193692207336, "value_row": 0.22225220501422882, "value_any": 0.068510502576828, "value_bot": 0.005869962275028229, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00174.png", "entropy": 0.7035025358200073} +{"ts": "2026-01-29T21:29:28.637177Z", "loop": 175, "env_steps": 107520000, "exact_value_avg": 0.31006017327308655, "regret_dist": 0.4937172532081604, "regret_other_env": 0.7610456943511963, "regret_corner": 0.09272453933954239, "regret_row": 0.5743347406387329, "regret_any": 0.7610456943511963, "regret_bot": 0.7908267378807068, "value_dist": 0.31006017327308655, "value_other_env": 0.06850749999284744, "value_corner": 0.6723892092704773, "value_row": 0.22235430777072906, "value_any": 0.06850749999284744, "value_bot": 0.005862319841980934, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00175.png", "entropy": 0.703337550163269} +{"ts": "2026-01-29T21:29:29.841338Z", "loop": 176, "env_steps": 108134400, "exact_value_avg": 0.3100775480270386, "regret_dist": 0.4936997592449188, "regret_other_env": 0.7610475420951843, "regret_corner": 0.09267809242010117, "regret_row": 0.5744224786758423, "regret_any": 0.7610475420951843, "regret_bot": 0.7908220291137695, "value_dist": 0.3100775480270386, "value_other_env": 0.06850551813840866, "value_corner": 0.6724355816841125, "value_row": 0.2222665399312973, "value_any": 0.06850551813840866, "value_bot": 0.00586703373119235, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00176.png", "entropy": 0.7032464146614075} +{"ts": "2026-01-29T21:29:31.045406Z", "loop": 177, "env_steps": 108748800, "exact_value_avg": 0.31026166677474976, "regret_dist": 0.4935157299041748, "regret_other_env": 0.7610365152359009, "regret_corner": 0.0922345370054245, "regret_row": 0.5757848620414734, "regret_any": 0.7610365152359009, "regret_bot": 0.7907350063323975, "value_dist": 0.31026166677474976, "value_other_env": 0.06851660460233688, "value_corner": 0.6728792190551758, "value_row": 0.220904141664505, "value_any": 0.06851660460233688, "value_bot": 0.005954015534371138, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00177.png", "entropy": 0.7037484049797058} +{"ts": "2026-01-29T21:29:32.248062Z", "loop": 178, "env_steps": 109363200, "exact_value_avg": 0.31044456362724304, "regret_dist": 0.4933328330516815, "regret_other_env": 0.76102614402771, "regret_corner": 0.09179277718067169, "regret_row": 0.5774034261703491, "regret_any": 0.76102614402771, "regret_bot": 0.7906316518783569, "value_dist": 0.31044456362724304, "value_other_env": 0.06852696090936661, "value_corner": 0.6733209490776062, "value_row": 0.21928562223911285, "value_any": 0.06852696090936661, "value_bot": 0.006057476159185171, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00178.png", "entropy": 0.7043164968490601} +{"ts": "2026-01-29T21:29:33.450575Z", "loop": 179, "env_steps": 109977600, "exact_value_avg": 0.3105965256690979, "regret_dist": 0.4931808412075043, "regret_other_env": 0.7610176801681519, "regret_corner": 0.09142555296421051, "regret_row": 0.5791068077087402, "regret_any": 0.7610176801681519, "regret_bot": 0.7905208468437195, "value_dist": 0.3105965256690979, "value_other_env": 0.06853541731834412, "value_corner": 0.6736881732940674, "value_row": 0.21758218109607697, "value_any": 0.06853541731834412, "value_bot": 0.00616820203140378, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00179.png", "entropy": 0.704871416091919} +{"ts": "2026-01-29T21:29:34.657536Z", "loop": 180, "env_steps": 110592000, "exact_value_avg": 0.31073886156082153, "regret_dist": 0.493038535118103, "regret_other_env": 0.7610093355178833, "regret_corner": 0.09108226746320724, "regret_row": 0.5810829401016235, "regret_any": 0.7610093355178833, "regret_bot": 0.7903904318809509, "value_dist": 0.31073886156082153, "value_other_env": 0.06854376196861267, "value_corner": 0.6740314960479736, "value_row": 0.21560607850551605, "value_any": 0.06854376196861267, "value_bot": 0.006298588123172522, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00180.png", "entropy": 0.7053639888763428} +{"ts": "2026-01-29T21:29:35.861951Z", "loop": 181, "env_steps": 111206400, "exact_value_avg": 0.31082528829574585, "regret_dist": 0.4929521083831787, "regret_other_env": 0.761006236076355, "regret_corner": 0.09087089449167252, "regret_row": 0.5827944874763489, "regret_any": 0.761006236076355, "regret_bot": 0.7902771830558777, "value_dist": 0.31082528829574585, "value_other_env": 0.0685468390583992, "value_corner": 0.6742429733276367, "value_row": 0.2138945311307907, "value_any": 0.0685468390583992, "value_bot": 0.0064118471927940845, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00181.png", "entropy": 0.7056490778923035} +{"ts": "2026-01-29T21:29:37.066621Z", "loop": 182, "env_steps": 111820800, "exact_value_avg": 0.31089574098587036, "regret_dist": 0.4928816854953766, "regret_other_env": 0.7610059976577759, "regret_corner": 0.09069517999887466, "regret_row": 0.5853443145751953, "regret_any": 0.7610059976577759, "regret_bot": 0.7901058197021484, "value_dist": 0.31089574098587036, "value_other_env": 0.06854717433452606, "value_corner": 0.674418568611145, "value_row": 0.21134473383426666, "value_any": 0.06854717433452606, "value_bot": 0.006583209149539471, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00182.png", "entropy": 0.7058747410774231} +{"ts": "2026-01-29T21:29:38.270583Z", "loop": 183, "env_steps": 112435200, "exact_value_avg": 0.3109110891819, "regret_dist": 0.49286630749702454, "regret_other_env": 0.7610131502151489, "regret_corner": 0.09064598381519318, "regret_row": 0.5877562165260315, "regret_any": 0.7610131502151489, "regret_bot": 0.789941132068634, "value_dist": 0.3109110891819, "value_other_env": 0.06853996962308884, "value_corner": 0.6744677424430847, "value_row": 0.20893290638923645, "value_any": 0.06853996962308884, "value_bot": 0.006747896317392588, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00183.png", "entropy": 0.7057856917381287} +{"ts": "2026-01-29T21:29:39.478364Z", "loop": 184, "env_steps": 113049600, "exact_value_avg": 0.31084489822387695, "regret_dist": 0.4929324686527252, "regret_other_env": 0.7610241770744324, "regret_corner": 0.09079483151435852, "regret_row": 0.5905054807662964, "regret_any": 0.7610241770744324, "regret_bot": 0.7897489070892334, "value_dist": 0.31084489822387695, "value_other_env": 0.068528912961483, "value_corner": 0.6743189096450806, "value_row": 0.20618359744548798, "value_any": 0.068528912961483, "value_bot": 0.0069401320070028305, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00184.png", "entropy": 0.7055110335350037} +{"ts": "2026-01-29T21:29:40.683519Z", "loop": 185, "env_steps": 113664000, "exact_value_avg": 0.31069058179855347, "regret_dist": 0.4930868446826935, "regret_other_env": 0.7610452771186829, "regret_corner": 0.09114912897348404, "regret_row": 0.5933743119239807, "regret_any": 0.7610452771186829, "regret_bot": 0.7895444631576538, "value_dist": 0.31069058179855347, "value_other_env": 0.06850789487361908, "value_corner": 0.6739646196365356, "value_row": 0.20331478118896484, "value_any": 0.06850789487361908, "value_bot": 0.007144578266888857, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00185.png", "entropy": 0.7048488259315491} +{"ts": "2026-01-29T21:29:41.887610Z", "loop": 186, "env_steps": 114278400, "exact_value_avg": 0.31051135063171387, "regret_dist": 0.4932660460472107, "regret_other_env": 0.7610669136047363, "regret_corner": 0.09156470745801926, "regret_row": 0.5956451892852783, "regret_any": 0.7610669136047363, "regret_bot": 0.7893797755241394, "value_dist": 0.31051135063171387, "value_other_env": 0.06848620623350143, "value_corner": 0.6735489964485168, "value_row": 0.20104381442070007, "value_any": 0.06848620623350143, "value_bot": 0.007309265900403261, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00186.png", "entropy": 0.7040930986404419} +{"ts": "2026-01-29T21:29:43.092069Z", "loop": 187, "env_steps": 114892800, "exact_value_avg": 0.31043997406959534, "regret_dist": 0.4933374524116516, "regret_other_env": 0.761078417301178, "regret_corner": 0.0917259231209755, "regret_row": 0.5964161157608032, "regret_any": 0.761078417301178, "regret_bot": 0.7893238067626953, "value_dist": 0.31043997406959534, "value_other_env": 0.06847469508647919, "value_corner": 0.6733878254890442, "value_row": 0.20027296245098114, "value_any": 0.06847469508647919, "value_bot": 0.007365264929831028, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00187.png", "entropy": 0.703681230545044} +{"ts": "2026-01-29T21:29:44.296214Z", "loop": 188, "env_steps": 115507200, "exact_value_avg": 0.31046152114868164, "regret_dist": 0.4933159053325653, "regret_other_env": 0.7610804438591003, "regret_corner": 0.09166905283927917, "regret_row": 0.5962620377540588, "regret_any": 0.7610804438591003, "regret_bot": 0.7893354892730713, "value_dist": 0.31046152114868164, "value_other_env": 0.06847269833087921, "value_corner": 0.6734447479248047, "value_row": 0.20042698085308075, "value_any": 0.06847269833087921, "value_bot": 0.007353568449616432, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00188.png", "entropy": 0.7035825252532959} +{"ts": "2026-01-29T21:29:45.501894Z", "loop": 189, "env_steps": 116121600, "exact_value_avg": 0.31055188179016113, "regret_dist": 0.4932255446910858, "regret_other_env": 0.761073112487793, "regret_corner": 0.09145414084196091, "regret_row": 0.5953479409217834, "regret_any": 0.761073112487793, "regret_bot": 0.7894035577774048, "value_dist": 0.31055188179016113, "value_other_env": 0.0684799998998642, "value_corner": 0.67365962266922, "value_row": 0.20134112238883972, "value_any": 0.0684799998998642, "value_bot": 0.007285583298653364, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00189.png", "entropy": 0.703778088092804} +{"ts": "2026-01-29T21:29:46.705829Z", "loop": 190, "env_steps": 116736000, "exact_value_avg": 0.3106641471385956, "regret_dist": 0.493113249540329, "regret_other_env": 0.7610636949539185, "regret_corner": 0.0911875069141388, "regret_row": 0.5939810872077942, "regret_any": 0.7610636949539185, "regret_bot": 0.7895036935806274, "value_dist": 0.3106641471385956, "value_other_env": 0.06848940253257751, "value_corner": 0.6739262342453003, "value_row": 0.20270796120166779, "value_any": 0.06848940253257751, "value_bot": 0.007185418624430895, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00190.png", "entropy": 0.7040886878967285} +{"ts": "2026-01-29T21:29:47.910811Z", "loop": 191, "env_steps": 117350400, "exact_value_avg": 0.3107161521911621, "regret_dist": 0.49306124448776245, "regret_other_env": 0.7610595226287842, "regret_corner": 0.09106376022100449, "regret_row": 0.5932396650314331, "regret_any": 0.7610595226287842, "regret_bot": 0.7895583510398865, "value_dist": 0.3107161521911621, "value_other_env": 0.06849360466003418, "value_corner": 0.6740499138832092, "value_row": 0.20344939827919006, "value_any": 0.06849360466003418, "value_bot": 0.007130784448236227, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00191.png", "entropy": 0.704199492931366} +{"ts": "2026-01-29T21:29:49.114652Z", "loop": 192, "env_steps": 117964800, "exact_value_avg": 0.310857355594635, "regret_dist": 0.49292001128196716, "regret_other_env": 0.7610491514205933, "regret_corner": 0.09072622656822205, "regret_row": 0.5908980965614319, "regret_any": 0.7610491514205933, "regret_bot": 0.7897266745567322, "value_dist": 0.310857355594635, "value_other_env": 0.06850393861532211, "value_corner": 0.674387514591217, "value_row": 0.20579098165035248, "value_any": 0.06850393861532211, "value_bot": 0.006962362676858902, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00192.png", "entropy": 0.7045072913169861} +{"ts": "2026-01-29T21:29:50.319543Z", "loop": 193, "env_steps": 118579200, "exact_value_avg": 0.31094789505004883, "regret_dist": 0.49282950162887573, "regret_other_env": 0.7610389590263367, "regret_corner": 0.09051527827978134, "regret_row": 0.5874100923538208, "regret_any": 0.7610389590263367, "regret_bot": 0.789971649646759, "value_dist": 0.31094789505004883, "value_other_env": 0.06851419806480408, "value_corner": 0.6745984554290771, "value_row": 0.20927895605564117, "value_any": 0.06851419806480408, "value_bot": 0.006717367563396692, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00193.png", "entropy": 0.7045845985412598} +{"ts": "2026-01-29T21:29:51.532472Z", "loop": 194, "env_steps": 119193600, "exact_value_avg": 0.31089070439338684, "regret_dist": 0.4928867220878601, "regret_other_env": 0.7610413432121277, "regret_corner": 0.09065467864274979, "regret_row": 0.5833143591880798, "regret_any": 0.7610413432121277, "regret_bot": 0.7902511954307556, "value_dist": 0.31089070439338684, "value_other_env": 0.06851179152727127, "value_corner": 0.6744590401649475, "value_row": 0.21337464451789856, "value_any": 0.06851179152727127, "value_bot": 0.006437912583351135, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00194.png", "entropy": 0.7041441202163696} +{"ts": "2026-01-29T21:29:52.738254Z", "loop": 195, "env_steps": 119808000, "exact_value_avg": 0.3106845021247864, "regret_dist": 0.4930928945541382, "regret_other_env": 0.7610574960708618, "regret_corner": 0.09114593267440796, "regret_row": 0.5795862078666687, "regret_any": 0.7610574960708618, "regret_bot": 0.7904988527297974, "value_dist": 0.3106845021247864, "value_other_env": 0.06849563121795654, "value_corner": 0.6739677786827087, "value_row": 0.2171027809381485, "value_any": 0.06849563121795654, "value_bot": 0.006190165411680937, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00195.png", "entropy": 0.7031877040863037} +{"ts": "2026-01-29T21:29:53.941222Z", "loop": 196, "env_steps": 120422400, "exact_value_avg": 0.31053391098976135, "regret_dist": 0.4932434558868408, "regret_other_env": 0.7610702514648438, "regret_corner": 0.09150318056344986, "regret_row": 0.5778703093528748, "regret_any": 0.7610702514648438, "regret_bot": 0.7906116843223572, "value_dist": 0.31053391098976135, "value_other_env": 0.06848283857107162, "value_corner": 0.673610508441925, "value_row": 0.2188187688589096, "value_any": 0.06848283857107162, "value_bot": 0.006077438127249479, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00196.png", "entropy": 0.7025040984153748} +{"ts": "2026-01-29T21:29:55.145319Z", "loop": 197, "env_steps": 121036800, "exact_value_avg": 0.31053420901298523, "regret_dist": 0.4932432174682617, "regret_other_env": 0.7610718607902527, "regret_corner": 0.0915001928806305, "regret_row": 0.5777996182441711, "regret_any": 0.7610718607902527, "regret_bot": 0.7906168103218079, "value_dist": 0.31053420901298523, "value_other_env": 0.06848125159740448, "value_corner": 0.6736136078834534, "value_row": 0.21888944506645203, "value_any": 0.06848125159740448, "value_bot": 0.006072251591831446, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00197.png", "entropy": 0.702392041683197} +{"ts": "2026-01-29T21:29:56.348979Z", "loop": 198, "env_steps": 121651200, "exact_value_avg": 0.3106063902378082, "regret_dist": 0.49317100644111633, "regret_other_env": 0.7610679268836975, "regret_corner": 0.091325543820858, "regret_row": 0.5786360502243042, "regret_any": 0.7610679268836975, "regret_bot": 0.7905629277229309, "value_dist": 0.3106063902378082, "value_other_env": 0.06848517805337906, "value_corner": 0.6737881898880005, "value_row": 0.21805304288864136, "value_any": 0.06848517805337906, "value_bot": 0.006126135587692261, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00198.png", "entropy": 0.7026568055152893} +{"ts": "2026-01-29T21:29:57.556455Z", "loop": 199, "env_steps": 122265600, "exact_value_avg": 0.31072044372558594, "regret_dist": 0.4930569529533386, "regret_other_env": 0.761061429977417, "regret_corner": 0.09105022996664047, "regret_row": 0.5799826979637146, "regret_any": 0.761061429977417, "regret_bot": 0.7904751896858215, "value_dist": 0.31072044372558594, "value_other_env": 0.06849174946546555, "value_corner": 0.674063503742218, "value_row": 0.2167063057422638, "value_any": 0.06849174946546555, "value_bot": 0.006213873624801636, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00199.png", "entropy": 0.7030512690544128} +{"ts": "2026-01-29T21:29:58.759737Z", "loop": 200, "env_steps": 122880000, "exact_value_avg": 0.3108333349227905, "regret_dist": 0.49294406175613403, "regret_other_env": 0.7610541582107544, "regret_corner": 0.09077886492013931, "regret_row": 0.5817883610725403, "regret_any": 0.7610541582107544, "regret_bot": 0.7903558015823364, "value_dist": 0.3108333349227905, "value_other_env": 0.06849893182516098, "value_corner": 0.6743348836898804, "value_row": 0.21490070223808289, "value_any": 0.06849893182516098, "value_bot": 0.006333252880722284, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00200.png", "entropy": 0.703474760055542} +{"ts": "2026-01-29T21:29:59.962941Z", "loop": 201, "env_steps": 123494400, "exact_value_avg": 0.31091827154159546, "regret_dist": 0.4928591847419739, "regret_other_env": 0.7610505819320679, "regret_corner": 0.09057197719812393, "regret_row": 0.5836949348449707, "regret_any": 0.7610505819320679, "regret_bot": 0.7902289628982544, "value_dist": 0.31091827154159546, "value_other_env": 0.06850256025791168, "value_corner": 0.6745417714118958, "value_row": 0.21299414336681366, "value_any": 0.06850256025791168, "value_bot": 0.006460119038820267, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00201.png", "entropy": 0.7037994861602783} +{"ts": "2026-01-29T21:30:01.166017Z", "loop": 202, "env_steps": 124108800, "exact_value_avg": 0.31096571683883667, "regret_dist": 0.49281173944473267, "regret_other_env": 0.7610515356063843, "regret_corner": 0.09045197069644928, "regret_row": 0.5862231850624084, "regret_any": 0.7610515356063843, "regret_bot": 0.7900571823120117, "value_dist": 0.31096571683883667, "value_other_env": 0.06850162148475647, "value_corner": 0.6746618151664734, "value_row": 0.21046586334705353, "value_any": 0.06850162148475647, "value_bot": 0.006631930358707905, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00202.png", "entropy": 0.7040337920188904} +{"ts": "2026-01-29T21:30:02.369430Z", "loop": 203, "env_steps": 124723200, "exact_value_avg": 0.31095215678215027, "regret_dist": 0.49282529950141907, "regret_other_env": 0.7610530853271484, "regret_corner": 0.09048354625701904, "regret_row": 0.588172435760498, "regret_any": 0.7610530853271484, "regret_bot": 0.7899228930473328, "value_dist": 0.31095215678215027, "value_other_env": 0.06850007176399231, "value_corner": 0.6746302247047424, "value_row": 0.20851664245128632, "value_any": 0.06850007176399231, "value_bot": 0.006766175385564566, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00203.png", "entropy": 0.7040992975234985} +{"ts": "2026-01-29T21:30:03.572463Z", "loop": 204, "env_steps": 125337600, "exact_value_avg": 0.3109190762042999, "regret_dist": 0.49285829067230225, "regret_other_env": 0.7610596418380737, "regret_corner": 0.09055620431900024, "regret_row": 0.5896924138069153, "regret_any": 0.7610596418380737, "regret_bot": 0.78981614112854, "value_dist": 0.3109190762042999, "value_other_env": 0.06849341839551926, "value_corner": 0.6745575070381165, "value_row": 0.2069966346025467, "value_any": 0.06849341839551926, "value_bot": 0.006872821133583784, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00204.png", "entropy": 0.7039812207221985} +{"ts": "2026-01-29T21:30:04.775509Z", "loop": 205, "env_steps": 125952000, "exact_value_avg": 0.3108784854412079, "regret_dist": 0.49289894104003906, "regret_other_env": 0.7610655426979065, "regret_corner": 0.09064894914627075, "regret_row": 0.5907253623008728, "regret_any": 0.7610655426979065, "regret_bot": 0.7897449731826782, "value_dist": 0.3108784854412079, "value_other_env": 0.06848761439323425, "value_corner": 0.674464762210846, "value_row": 0.20596368610858917, "value_any": 0.06848761439323425, "value_bot": 0.006944030523300171, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00205.png", "entropy": 0.7037675976753235} +{"ts": "2026-01-29T21:30:05.979216Z", "loop": 206, "env_steps": 126566400, "exact_value_avg": 0.31081923842430115, "regret_dist": 0.492958128452301, "regret_other_env": 0.7610752582550049, "regret_corner": 0.09078241139650345, "regret_row": 0.5921651124954224, "regret_any": 0.7610752582550049, "regret_bot": 0.7896429300308228, "value_dist": 0.31081923842430115, "value_other_env": 0.0684778168797493, "value_corner": 0.6743313074111938, "value_row": 0.2045239508152008, "value_any": 0.0684778168797493, "value_bot": 0.007046085316687822, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00206.png", "entropy": 0.7034957408905029} +{"ts": "2026-01-29T21:30:07.184150Z", "loop": 207, "env_steps": 127180800, "exact_value_avg": 0.3107357621192932, "regret_dist": 0.49304163455963135, "regret_other_env": 0.7610850930213928, "regret_corner": 0.09097639471292496, "regret_row": 0.5934855341911316, "regret_any": 0.7610850930213928, "regret_bot": 0.7895485162734985, "value_dist": 0.3107357621192932, "value_other_env": 0.06846798211336136, "value_corner": 0.6741373538970947, "value_row": 0.20320351421833038, "value_any": 0.06846798211336136, "value_bot": 0.007140511181205511, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00207.png", "entropy": 0.7031598687171936} +{"ts": "2026-01-29T21:30:08.387075Z", "loop": 208, "env_steps": 127795200, "exact_value_avg": 0.3107641339302063, "regret_dist": 0.4930132329463959, "regret_other_env": 0.761082112789154, "regret_corner": 0.09090989828109741, "regret_row": 0.5930465459823608, "regret_any": 0.761082112789154, "regret_bot": 0.7895795106887817, "value_dist": 0.3107641339302063, "value_other_env": 0.06847099214792252, "value_corner": 0.6742038726806641, "value_row": 0.20364250242710114, "value_any": 0.06847099214792252, "value_bot": 0.007109487894922495, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00208.png", "entropy": 0.7032129764556885} +{"ts": "2026-01-29T21:30:09.591417Z", "loop": 209, "env_steps": 128409600, "exact_value_avg": 0.31083008646965027, "regret_dist": 0.4929473102092743, "regret_other_env": 0.7610759139060974, "regret_corner": 0.09075432270765305, "regret_row": 0.5919864177703857, "regret_any": 0.7610759139060974, "regret_bot": 0.7896566390991211, "value_dist": 0.31083008646965027, "value_other_env": 0.06847718358039856, "value_corner": 0.6743594408035278, "value_row": 0.20470257103443146, "value_any": 0.06847718358039856, "value_bot": 0.007032440509647131, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00209.png", "entropy": 0.7033801674842834} +{"ts": "2026-01-29T21:30:10.794443Z", "loop": 210, "env_steps": 129024000, "exact_value_avg": 0.3108808994293213, "regret_dist": 0.4928964674472809, "regret_other_env": 0.7610694766044617, "regret_corner": 0.09063688665628433, "regret_row": 0.591048002243042, "regret_any": 0.7610694766044617, "regret_bot": 0.7897229790687561, "value_dist": 0.3108808994293213, "value_other_env": 0.0684836134314537, "value_corner": 0.6744768619537354, "value_row": 0.2056410312652588, "value_any": 0.0684836134314537, "value_bot": 0.0069661266170442104, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00210.png", "entropy": 0.7035036087036133} +{"ts": "2026-01-29T21:30:11.996686Z", "loop": 211, "env_steps": 129638400, "exact_value_avg": 0.31092599034309387, "regret_dist": 0.4928513765335083, "regret_other_env": 0.761062741279602, "regret_corner": 0.09053430706262589, "regret_row": 0.5897899866104126, "regret_any": 0.761062741279602, "regret_bot": 0.7898111939430237, "value_dist": 0.31092599034309387, "value_other_env": 0.06849037110805511, "value_corner": 0.6745794415473938, "value_row": 0.20689904689788818, "value_any": 0.06849037110805511, "value_bot": 0.006877831649035215, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00211.png", "entropy": 0.7036203145980835} +{"ts": "2026-01-29T21:30:13.204466Z", "loop": 212, "env_steps": 130252800, "exact_value_avg": 0.31097477674484253, "regret_dist": 0.49280259013175964, "regret_other_env": 0.7610553503036499, "regret_corner": 0.09042338281869888, "regret_row": 0.5879190564155579, "regret_any": 0.7610553503036499, "regret_bot": 0.7899402976036072, "value_dist": 0.31097477674484253, "value_other_env": 0.0684976875782013, "value_corner": 0.6746903657913208, "value_row": 0.2087700068950653, "value_any": 0.0684976875782013, "value_bot": 0.006748710758984089, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00212.png", "entropy": 0.7036977410316467} +{"ts": "2026-01-29T21:30:14.409346Z", "loop": 213, "env_steps": 130867200, "exact_value_avg": 0.3109680712223053, "regret_dist": 0.49280932545661926, "regret_other_env": 0.7610505223274231, "regret_corner": 0.09044748544692993, "regret_row": 0.5856100916862488, "regret_any": 0.7610505223274231, "regret_bot": 0.7900989651679993, "value_dist": 0.3109680712223053, "value_other_env": 0.06850262731313705, "value_corner": 0.6746662259101868, "value_row": 0.2110789567232132, "value_any": 0.06850262731313705, "value_bot": 0.006590071599930525, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00213.png", "entropy": 0.7036401629447937} +{"ts": "2026-01-29T21:30:15.611090Z", "loop": 214, "env_steps": 131481600, "exact_value_avg": 0.31092965602874756, "regret_dist": 0.4928477108478546, "regret_other_env": 0.761053204536438, "regret_corner": 0.09053945541381836, "regret_row": 0.5838028192520142, "regret_any": 0.761053204536438, "regret_bot": 0.7902218699455261, "value_dist": 0.31092965602874756, "value_other_env": 0.06849990040063858, "value_corner": 0.6745743155479431, "value_row": 0.21288619935512543, "value_any": 0.06849990040063858, "value_bot": 0.00646715285256505, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00214.png", "entropy": 0.7034395337104797} +{"ts": "2026-01-29T21:30:16.813680Z", "loop": 215, "env_steps": 132096000, "exact_value_avg": 0.3108959496021271, "regret_dist": 0.4928813874721527, "regret_other_env": 0.7610549330711365, "regret_corner": 0.09062101691961288, "regret_row": 0.5828890204429626, "regret_any": 0.7610549330711365, "regret_bot": 0.7902833819389343, "value_dist": 0.3108959496021271, "value_other_env": 0.0684981718659401, "value_corner": 0.6744926571846008, "value_row": 0.21379999816417694, "value_any": 0.0684981718659401, "value_bot": 0.006405645050108433, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00215.png", "entropy": 0.7033053636550903} +{"ts": "2026-01-29T21:30:18.015177Z", "loop": 216, "env_steps": 132710400, "exact_value_avg": 0.31087595224380493, "regret_dist": 0.49290141463279724, "regret_other_env": 0.7610574960708618, "regret_corner": 0.0906672552227974, "regret_row": 0.5823183655738831, "regret_any": 0.7610574960708618, "regret_bot": 0.7903221845626831, "value_dist": 0.31087595224380493, "value_other_env": 0.06849563121795654, "value_corner": 0.6744464635848999, "value_row": 0.21437066793441772, "value_any": 0.06849563121795654, "value_bot": 0.006366888526827097, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00216.png", "entropy": 0.7032027244567871} +{"ts": "2026-01-29T21:30:19.216779Z", "loop": 217, "env_steps": 133324800, "exact_value_avg": 0.31078994274139404, "regret_dist": 0.49298742413520813, "regret_other_env": 0.7610645294189453, "regret_corner": 0.09087176620960236, "regret_row": 0.5808152556419373, "regret_any": 0.7610645294189453, "regret_bot": 0.7904229164123535, "value_dist": 0.31078994274139404, "value_other_env": 0.06848860532045364, "value_corner": 0.6742419004440308, "value_row": 0.2158738076686859, "value_any": 0.06848860532045364, "value_bot": 0.0062661138363182545, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00217.png", "entropy": 0.7028871774673462} +{"ts": "2026-01-29T21:30:20.416712Z", "loop": 218, "env_steps": 133939200, "exact_value_avg": 0.3107927441596985, "regret_dist": 0.4929846525192261, "regret_other_env": 0.7610650658607483, "regret_corner": 0.09086401760578156, "regret_row": 0.5808911919593811, "regret_any": 0.7610650658607483, "regret_bot": 0.7904176115989685, "value_dist": 0.3107927441596985, "value_other_env": 0.06848808377981186, "value_corner": 0.6742497086524963, "value_row": 0.21579788625240326, "value_any": 0.06848808377981186, "value_bot": 0.006271433550864458, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00218.png", "entropy": 0.702926754951477} +{"ts": "2026-01-29T21:30:21.618896Z", "loop": 219, "env_steps": 134553600, "exact_value_avg": 0.3107946515083313, "regret_dist": 0.49298274517059326, "regret_other_env": 0.7610664367675781, "regret_corner": 0.09085717797279358, "regret_row": 0.5809347629547119, "regret_any": 0.7610664367675781, "regret_bot": 0.7904149293899536, "value_dist": 0.3107946515083313, "value_other_env": 0.06848667562007904, "value_corner": 0.6742565631866455, "value_row": 0.21575427055358887, "value_any": 0.06848667562007904, "value_bot": 0.006274088751524687, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00219.png", "entropy": 0.7029659152030945} +{"ts": "2026-01-29T21:30:22.820701Z", "loop": 220, "env_steps": 135168000, "exact_value_avg": 0.31083840131759644, "regret_dist": 0.49293893575668335, "regret_other_env": 0.761063277721405, "regret_corner": 0.09075238555669785, "regret_row": 0.5816890001296997, "regret_any": 0.761063277721405, "regret_bot": 0.79036545753479, "value_dist": 0.31083840131759644, "value_other_env": 0.06848976761102676, "value_corner": 0.6743613481521606, "value_row": 0.21500004827976227, "value_any": 0.06848976761102676, "value_bot": 0.0063236178830266, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00220.png", "entropy": 0.7031373381614685} +{"ts": "2026-01-29T21:30:24.022241Z", "loop": 221, "env_steps": 135782400, "exact_value_avg": 0.3109029531478882, "regret_dist": 0.4928744435310364, "regret_other_env": 0.7610601186752319, "regret_corner": 0.09059585630893707, "regret_row": 0.583092987537384, "regret_any": 0.7610601186752319, "regret_bot": 0.7902716994285583, "value_dist": 0.3109029531478882, "value_other_env": 0.06849298626184464, "value_corner": 0.6745178699493408, "value_row": 0.21359606087207794, "value_any": 0.06849298626184464, "value_bot": 0.006417331285774708, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00221.png", "entropy": 0.703407883644104} +{"ts": "2026-01-29T21:30:25.224034Z", "loop": 222, "env_steps": 136396800, "exact_value_avg": 0.3109321594238281, "regret_dist": 0.49284520745277405, "regret_other_env": 0.7610583305358887, "regret_corner": 0.09052547067403793, "regret_row": 0.5838473439216614, "regret_any": 0.7610583305358887, "regret_bot": 0.7902213335037231, "value_dist": 0.3109321594238281, "value_other_env": 0.06849472969770432, "value_corner": 0.6745883226394653, "value_row": 0.2128416746854782, "value_any": 0.06849472969770432, "value_bot": 0.006467755418270826, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00222.png", "entropy": 0.7035678625106812} +{"ts": "2026-01-29T21:30:26.428177Z", "loop": 223, "env_steps": 137011200, "exact_value_avg": 0.3109447956085205, "regret_dist": 0.4928325414657593, "regret_other_env": 0.7610554695129395, "regret_corner": 0.09049811214208603, "regret_row": 0.584520161151886, "regret_any": 0.7610554695129395, "regret_bot": 0.7901747226715088, "value_dist": 0.3109447956085205, "value_other_env": 0.06849759072065353, "value_corner": 0.6746155619621277, "value_row": 0.2121688723564148, "value_any": 0.06849759072065353, "value_bot": 0.006514330860227346, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00223.png", "entropy": 0.7037061452865601} +{"ts": "2026-01-29T21:30:27.630813Z", "loop": 224, "env_steps": 137625600, "exact_value_avg": 0.3109425902366638, "regret_dist": 0.49283477663993835, "regret_other_env": 0.7610548734664917, "regret_corner": 0.09050456434488297, "regret_row": 0.5845380425453186, "regret_any": 0.7610548734664917, "regret_bot": 0.7901737093925476, "value_dist": 0.3109425902366638, "value_other_env": 0.06849822402000427, "value_corner": 0.6746091842651367, "value_row": 0.21215097606182098, "value_any": 0.06849822402000427, "value_bot": 0.006515338085591793, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00224.png", "entropy": 0.7037597298622131} +{"ts": "2026-01-29T21:30:28.834911Z", "loop": 225, "env_steps": 138240000, "exact_value_avg": 0.3109385371208191, "regret_dist": 0.49283885955810547, "regret_other_env": 0.7610535025596619, "regret_corner": 0.09051690250635147, "regret_row": 0.5842926502227783, "regret_any": 0.7610535025596619, "regret_bot": 0.7901898622512817, "value_dist": 0.3109385371208191, "value_other_env": 0.0684996172785759, "value_corner": 0.674596905708313, "value_row": 0.21239632368087769, "value_any": 0.0684996172785759, "value_bot": 0.006499180570244789, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00225.png", "entropy": 0.7037808299064636} +{"ts": "2026-01-29T21:30:30.038734Z", "loop": 226, "env_steps": 138854400, "exact_value_avg": 0.31093889474868774, "regret_dist": 0.4928385615348816, "regret_other_env": 0.7610530853271484, "regret_corner": 0.09051672369241714, "regret_row": 0.5842238664627075, "regret_any": 0.7610530853271484, "regret_bot": 0.7901952266693115, "value_dist": 0.31093889474868774, "value_other_env": 0.06850006431341171, "value_corner": 0.6745970845222473, "value_row": 0.21246518194675446, "value_any": 0.06850006431341171, "value_bot": 0.006493783555924892, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00226.png", "entropy": 0.7037597894668579} +{"ts": "2026-01-29T21:30:31.249058Z", "loop": 227, "env_steps": 139468800, "exact_value_avg": 0.3109537661075592, "regret_dist": 0.4928235709667206, "regret_other_env": 0.7610539197921753, "regret_corner": 0.09047798812389374, "regret_row": 0.584857165813446, "regret_any": 0.7610539197921753, "regret_bot": 0.7901522517204285, "value_dist": 0.3109537661075592, "value_other_env": 0.06849916279315948, "value_corner": 0.6746357083320618, "value_row": 0.21183191239833832, "value_any": 0.06849916279315948, "value_bot": 0.006536793429404497, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00227.png", "entropy": 0.7037798762321472} +{"ts": "2026-01-29T21:30:32.452774Z", "loop": 228, "env_steps": 140083200, "exact_value_avg": 0.3109667897224426, "regret_dist": 0.49281057715415955, "regret_other_env": 0.7610548138618469, "regret_corner": 0.09044414013624191, "regret_row": 0.5855947732925415, "regret_any": 0.7610548138618469, "regret_bot": 0.7901025414466858, "value_dist": 0.3109667897224426, "value_other_env": 0.06849826127290726, "value_corner": 0.6746695637702942, "value_row": 0.21109430491924286, "value_any": 0.06849826127290726, "value_bot": 0.006586482748389244, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00228.png", "entropy": 0.703825056552887} +{"ts": "2026-01-29T21:30:33.657689Z", "loop": 229, "env_steps": 140697600, "exact_value_avg": 0.31097206473350525, "regret_dist": 0.4928053319454193, "regret_other_env": 0.7610557675361633, "regret_corner": 0.0904296264052391, "regret_row": 0.5864514708518982, "regret_any": 0.7610557675361633, "regret_bot": 0.7900440096855164, "value_dist": 0.31097206473350525, "value_other_env": 0.06849735230207443, "value_corner": 0.6746841073036194, "value_row": 0.21023757755756378, "value_any": 0.06849735230207443, "value_bot": 0.006645015440881252, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00229.png", "entropy": 0.7039046883583069} +{"ts": "2026-01-29T21:30:34.862210Z", "loop": 230, "env_steps": 141312000, "exact_value_avg": 0.3109755218029022, "regret_dist": 0.49280187487602234, "regret_other_env": 0.7610541582107544, "regret_corner": 0.09042336791753769, "regret_row": 0.586984395980835, "regret_any": 0.7610541582107544, "regret_bot": 0.7900069355964661, "value_dist": 0.3109755218029022, "value_other_env": 0.06849895417690277, "value_corner": 0.6746903657913208, "value_row": 0.20970462262630463, "value_any": 0.06849895417690277, "value_bot": 0.006682108156383038, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00230.png", "entropy": 0.7039209604263306} +{"ts": "2026-01-29T21:30:36.067224Z", "loop": 231, "env_steps": 141926400, "exact_value_avg": 0.31095612049102783, "regret_dist": 0.49282127618789673, "regret_other_env": 0.7610572576522827, "regret_corner": 0.09046729654073715, "regret_row": 0.5886505842208862, "regret_any": 0.7610572576522827, "regret_bot": 0.7898911833763123, "value_dist": 0.31095612049102783, "value_other_env": 0.06849590688943863, "value_corner": 0.6746464371681213, "value_row": 0.20803846418857574, "value_any": 0.06849590688943863, "value_bot": 0.006797899957746267, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00231.png", "entropy": 0.7039327621459961} +{"ts": "2026-01-29T21:30:37.272473Z", "loop": 232, "env_steps": 142540800, "exact_value_avg": 0.31094297766685486, "regret_dist": 0.4928344488143921, "regret_other_env": 0.7610587477684021, "regret_corner": 0.09049791842699051, "regret_row": 0.589182436466217, "regret_any": 0.7610587477684021, "regret_bot": 0.7898539900779724, "value_dist": 0.31094297766685486, "value_other_env": 0.06849436461925507, "value_corner": 0.6746158599853516, "value_row": 0.20750659704208374, "value_any": 0.06849436461925507, "value_bot": 0.006835106294602156, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00232.png", "entropy": 0.7039046883583069} +{"ts": "2026-01-29T21:30:38.477866Z", "loop": 233, "env_steps": 143155200, "exact_value_avg": 0.31093281507492065, "regret_dist": 0.4928445816040039, "regret_other_env": 0.7610582113265991, "regret_corner": 0.09052407741546631, "regret_row": 0.5893697142601013, "regret_any": 0.7610582113265991, "regret_bot": 0.7898404002189636, "value_dist": 0.31093281507492065, "value_other_env": 0.06849487125873566, "value_corner": 0.6745896935462952, "value_row": 0.20731930434703827, "value_any": 0.06849487125873566, "value_bot": 0.006848656572401524, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00233.png", "entropy": 0.7039859294891357} +{"ts": "2026-01-29T21:30:39.682929Z", "loop": 234, "env_steps": 143769600, "exact_value_avg": 0.310901403427124, "regret_dist": 0.49287599325180054, "regret_other_env": 0.7610601782798767, "regret_corner": 0.0905996710062027, "regret_row": 0.590372622013092, "regret_any": 0.7610601782798767, "regret_bot": 0.7897699475288391, "value_dist": 0.310901403427124, "value_other_env": 0.06849295645952225, "value_corner": 0.6745140552520752, "value_row": 0.2063164860010147, "value_any": 0.06849295645952225, "value_bot": 0.006919149775058031, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00234.png", "entropy": 0.7039541006088257} +{"ts": "2026-01-29T21:30:40.888785Z", "loop": 235, "env_steps": 144384000, "exact_value_avg": 0.31087547540664673, "regret_dist": 0.49290192127227783, "regret_other_env": 0.7610657811164856, "regret_corner": 0.09065606445074081, "regret_row": 0.5911587476730347, "regret_any": 0.7610657811164856, "regret_bot": 0.7897143363952637, "value_dist": 0.31087547540664673, "value_other_env": 0.06848729401826859, "value_corner": 0.6744577288627625, "value_row": 0.20553027093410492, "value_any": 0.06848729401826859, "value_bot": 0.006974739022552967, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00235.png", "entropy": 0.7037924528121948} +{"ts": "2026-01-29T21:30:42.092181Z", "loop": 236, "env_steps": 144998400, "exact_value_avg": 0.31084832549095154, "regret_dist": 0.492929071187973, "regret_other_env": 0.761070966720581, "regret_corner": 0.09071619063615799, "regret_row": 0.5916529297828674, "regret_any": 0.761070966720581, "regret_bot": 0.789679765701294, "value_dist": 0.31084832549095154, "value_other_env": 0.0684821605682373, "value_corner": 0.6743975877761841, "value_row": 0.20503616333007812, "value_any": 0.0684821605682373, "value_bot": 0.007009313907474279, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00236.png", "entropy": 0.703626811504364} +{"ts": "2026-01-29T21:30:43.296314Z", "loop": 237, "env_steps": 145612800, "exact_value_avg": 0.3108481168746948, "regret_dist": 0.49292922019958496, "regret_other_env": 0.761075496673584, "regret_corner": 0.09070980548858643, "regret_row": 0.5917659401893616, "regret_any": 0.761075496673584, "regret_bot": 0.7896732091903687, "value_dist": 0.3108481168746948, "value_other_env": 0.06847760826349258, "value_corner": 0.6744039058685303, "value_row": 0.20492315292358398, "value_any": 0.06847760826349258, "value_bot": 0.007015945389866829, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00237.png", "entropy": 0.7034218311309814} +{"ts": "2026-01-29T21:30:44.500265Z", "loop": 238, "env_steps": 146227200, "exact_value_avg": 0.3108288645744324, "regret_dist": 0.4929485619068146, "regret_other_env": 0.761081874370575, "regret_corner": 0.09074849635362625, "regret_row": 0.5922199487686157, "regret_any": 0.761081874370575, "regret_bot": 0.7896417379379272, "value_dist": 0.3108288645744324, "value_other_env": 0.06847123801708221, "value_corner": 0.6743652820587158, "value_row": 0.20446908473968506, "value_any": 0.06847123801708221, "value_bot": 0.00704732583835721, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00238.png", "entropy": 0.7031756043434143} +{"ts": "2026-01-29T21:30:45.713480Z", "loop": 239, "env_steps": 146841600, "exact_value_avg": 0.31079721450805664, "regret_dist": 0.49298012256622314, "regret_other_env": 0.7610895037651062, "regret_corner": 0.09081605821847916, "regret_row": 0.5928357243537903, "regret_any": 0.7610895037651062, "regret_bot": 0.7895985841751099, "value_dist": 0.31079721450805664, "value_other_env": 0.068463534116745, "value_corner": 0.6742976903915405, "value_row": 0.20385335385799408, "value_any": 0.068463534116745, "value_bot": 0.0070904758758842945, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00239.png", "entropy": 0.7028694748878479} +{"ts": "2026-01-29T21:30:46.917140Z", "loop": 240, "env_steps": 147456000, "exact_value_avg": 0.3108202815055847, "regret_dist": 0.49295705556869507, "regret_other_env": 0.7610912919044495, "regret_corner": 0.0907556563615799, "regret_row": 0.592508852481842, "regret_any": 0.7610912919044495, "regret_bot": 0.7896236181259155, "value_dist": 0.3108202815055847, "value_other_env": 0.06846176832914352, "value_corner": 0.674358069896698, "value_row": 0.20418021082878113, "value_any": 0.06846176832914352, "value_bot": 0.007065464276820421, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00240.png", "entropy": 0.7027949690818787} +{"ts": "2026-01-29T21:30:48.124565Z", "loop": 241, "env_steps": 148070400, "exact_value_avg": 0.31087151169776917, "regret_dist": 0.492905855178833, "regret_other_env": 0.7610892653465271, "regret_corner": 0.09063074737787247, "regret_row": 0.5917086601257324, "regret_any": 0.7610892653465271, "regret_bot": 0.7896819114685059, "value_dist": 0.31087151169776917, "value_other_env": 0.06846383213996887, "value_corner": 0.6744830012321472, "value_row": 0.20498034358024597, "value_any": 0.06846383213996887, "value_bot": 0.007007089909166098, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00241.png", "entropy": 0.7027530074119568} +{"ts": "2026-01-29T21:30:49.331450Z", "loop": 242, "env_steps": 148684800, "exact_value_avg": 0.3109378218650818, "regret_dist": 0.49283960461616516, "regret_other_env": 0.7610872387886047, "regret_corner": 0.09046810865402222, "regret_row": 0.5901747941970825, "regret_any": 0.7610872387886047, "regret_bot": 0.7897914052009583, "value_dist": 0.3109378218650818, "value_other_env": 0.06846588850021362, "value_corner": 0.6746456623077393, "value_row": 0.20651419460773468, "value_any": 0.06846588850021362, "value_bot": 0.0068976739421486855, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00242.png", "entropy": 0.7027637362480164} +{"ts": "2026-01-29T21:30:50.534646Z", "loop": 243, "env_steps": 149299200, "exact_value_avg": 0.3109970986843109, "regret_dist": 0.49278029799461365, "regret_other_env": 0.7610819935798645, "regret_corner": 0.09032769501209259, "regret_row": 0.5879088044166565, "regret_any": 0.7610819935798645, "regret_bot": 0.7899507284164429, "value_dist": 0.3109970986843109, "value_other_env": 0.06847112625837326, "value_corner": 0.6747860312461853, "value_row": 0.2087801843881607, "value_any": 0.06847112625837326, "value_bot": 0.006738284137099981, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00243.png", "entropy": 0.7027691006660461} +{"ts": "2026-01-29T21:30:51.738034Z", "loop": 244, "env_steps": 149913600, "exact_value_avg": 0.31099897623062134, "regret_dist": 0.49277839064598083, "regret_other_env": 0.7610831260681152, "regret_corner": 0.09032125771045685, "regret_row": 0.5854372382164001, "regret_any": 0.7610831260681152, "regret_bot": 0.7901207804679871, "value_dist": 0.31099897623062134, "value_other_env": 0.06846996396780014, "value_corner": 0.674792468547821, "value_row": 0.21125179529190063, "value_any": 0.06846996396780014, "value_bot": 0.006568230222910643, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00244.png", "entropy": 0.7025429606437683} +{"ts": "2026-01-29T21:30:52.949332Z", "loop": 245, "env_steps": 150528000, "exact_value_avg": 0.3109275996685028, "regret_dist": 0.49284979701042175, "regret_other_env": 0.7610888481140137, "regret_corner": 0.09049120545387268, "regret_row": 0.5828454494476318, "regret_any": 0.7610888481140137, "regret_bot": 0.7902956604957581, "value_dist": 0.3109275996685028, "value_other_env": 0.06846428662538528, "value_corner": 0.6746225357055664, "value_row": 0.21384356915950775, "value_any": 0.06846428662538528, "value_bot": 0.006393409334123135, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00245.png", "entropy": 0.7020792365074158} +{"ts": "2026-01-29T21:30:54.164768Z", "loop": 246, "env_steps": 151142400, "exact_value_avg": 0.3107905089855194, "regret_dist": 0.49298691749572754, "regret_other_env": 0.7611006498336792, "regret_corner": 0.09081625938415527, "regret_row": 0.5803134441375732, "regret_any": 0.7611006498336792, "regret_bot": 0.7904643416404724, "value_dist": 0.3107905089855194, "value_other_env": 0.06845250725746155, "value_corner": 0.6742975115776062, "value_row": 0.21637558937072754, "value_any": 0.06845250725746155, "value_bot": 0.00622476264834404, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00246.png", "entropy": 0.701405942440033} +{"ts": "2026-01-29T21:30:55.377873Z", "loop": 247, "env_steps": 151756800, "exact_value_avg": 0.3107556998729706, "regret_dist": 0.493021696805954, "regret_other_env": 0.7611061334609985, "regret_corner": 0.09089501947164536, "regret_row": 0.5797067880630493, "regret_any": 0.7611061334609985, "regret_bot": 0.7905037999153137, "value_dist": 0.3107556998729706, "value_other_env": 0.06844699382781982, "value_corner": 0.6742187142372131, "value_row": 0.21698224544525146, "value_any": 0.06844699382781982, "value_bot": 0.006185166072100401, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00247.png", "entropy": 0.7011244297027588} +{"ts": "2026-01-29T21:30:56.583086Z", "loop": 248, "env_steps": 152371200, "exact_value_avg": 0.31079044938087463, "regret_dist": 0.4929869472980499, "regret_other_env": 0.761106550693512, "regret_corner": 0.09080752730369568, "regret_row": 0.5801637172698975, "regret_any": 0.761106550693512, "regret_bot": 0.7904747128486633, "value_dist": 0.31079044938087463, "value_other_env": 0.0684465616941452, "value_corner": 0.6743062734603882, "value_row": 0.21652533113956451, "value_any": 0.0684465616941452, "value_bot": 0.0062143574468791485, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00248.png", "entropy": 0.701129138469696} +{"ts": "2026-01-29T21:30:57.790331Z", "loop": 249, "env_steps": 152985600, "exact_value_avg": 0.31079918146133423, "regret_dist": 0.49297821521759033, "regret_other_env": 0.7611072659492493, "regret_corner": 0.09078454226255417, "regret_row": 0.5803090333938599, "regret_any": 0.7611072659492493, "regret_bot": 0.7904653549194336, "value_dist": 0.31079918146133423, "value_other_env": 0.0684458315372467, "value_corner": 0.6743291616439819, "value_row": 0.21637998521327972, "value_any": 0.0684458315372467, "value_bot": 0.006223691627383232, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00249.png", "entropy": 0.7010976672172546} +{"ts": "2026-01-29T21:30:59.001150Z", "loop": 250, "env_steps": 153600000, "exact_value_avg": 0.31087446212768555, "regret_dist": 0.4929029047489166, "regret_other_env": 0.7611056566238403, "regret_corner": 0.09059876948595047, "regret_row": 0.5814791321754456, "regret_any": 0.7611056566238403, "regret_bot": 0.7903885841369629, "value_dist": 0.31087446212768555, "value_other_env": 0.06844743341207504, "value_corner": 0.6745149493217468, "value_row": 0.21520988643169403, "value_any": 0.06844743341207504, "value_bot": 0.006300423759967089, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00250.png", "entropy": 0.701309859752655} +{"ts": "2026-01-29T21:31:01.364853Z", "loop": 252, "env_steps": 154828800, "exact_value_avg": 0.3110257387161255, "regret_dist": 0.4927516579627991, "regret_other_env": 0.7611015439033508, "regret_corner": 0.09022674709558487, "regret_row": 0.5858551859855652, "regret_any": 0.7611015439033508, "regret_bot": 0.7900964617729187, "value_dist": 0.3110257387161255, "value_other_env": 0.06845156848430634, "value_corner": 0.6748870015144348, "value_row": 0.2108338475227356, "value_any": 0.06845156848430634, "value_bot": 0.006592629011720419, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00252.png", "entropy": 0.7017640471458435} +{"ts": "2026-01-29T21:31:03.742957Z", "loop": 254, "env_steps": 156057600, "exact_value_avg": 0.3109700381755829, "regret_dist": 0.49280738830566406, "regret_other_env": 0.7611180543899536, "regret_corner": 0.09034133702516556, "regret_row": 0.5904850363731384, "regret_any": 0.7611180543899536, "regret_bot": 0.7897780537605286, "value_dist": 0.3109700381755829, "value_other_env": 0.06843505054712296, "value_corner": 0.6747724413871765, "value_row": 0.20620393753051758, "value_any": 0.06843505054712296, "value_bot": 0.006911046337336302, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00254.png", "entropy": 0.7013189196586609} +{"ts": "2026-01-29T21:31:06.123334Z", "loop": 256, "env_steps": 157286400, "exact_value_avg": 0.3107217848300934, "regret_dist": 0.4930555522441864, "regret_other_env": 0.761150062084198, "regret_corner": 0.0909137949347496, "regret_row": 0.5946539640426636, "regret_any": 0.761150062084198, "regret_bot": 0.7894815802574158, "value_dist": 0.3107217848300934, "value_other_env": 0.06840301305055618, "value_corner": 0.6741998791694641, "value_row": 0.2020350694656372, "value_any": 0.06840301305055618, "value_bot": 0.007207473739981651, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00256.png", "entropy": 0.7002149820327759} +{"ts": "2026-01-29T21:31:08.495753Z", "loop": 258, "env_steps": 158515200, "exact_value_avg": 0.31073224544525146, "regret_dist": 0.4930451512336731, "regret_other_env": 0.7611555457115173, "regret_corner": 0.09087949246168137, "regret_row": 0.5946437120437622, "regret_any": 0.7611555457115173, "regret_bot": 0.7894839644432068, "value_dist": 0.31073224544525146, "value_other_env": 0.06839754432439804, "value_corner": 0.6742342114448547, "value_row": 0.20204536616802216, "value_any": 0.06839754432439804, "value_bot": 0.007205038797110319, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00258.png", "entropy": 0.6999337673187256} +{"ts": "2026-01-29T21:31:10.858091Z", "loop": 260, "env_steps": 159744000, "exact_value_avg": 0.31090012192726135, "regret_dist": 0.4928772747516632, "regret_other_env": 0.7611437439918518, "regret_corner": 0.09047756344079971, "regret_row": 0.5923211574554443, "regret_any": 0.7611437439918518, "regret_bot": 0.7896521091461182, "value_dist": 0.31090012192726135, "value_other_env": 0.06840938329696655, "value_corner": 0.67463618516922, "value_row": 0.20436789095401764, "value_any": 0.06840938329696655, "value_bot": 0.007037017494440079, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00260.png", "entropy": 0.7002914547920227} +{"ts": "2026-01-29T21:31:13.228847Z", "loop": 262, "env_steps": 160972800, "exact_value_avg": 0.31100696325302124, "regret_dist": 0.49277040362358093, "regret_other_env": 0.7611406445503235, "regret_corner": 0.09021499007940292, "regret_row": 0.5901787877082825, "regret_any": 0.7611406445503235, "regret_bot": 0.7898048162460327, "value_dist": 0.31100696325302124, "value_other_env": 0.06841246783733368, "value_corner": 0.6748986840248108, "value_row": 0.2065102905035019, "value_any": 0.06841246783733368, "value_bot": 0.006884293630719185, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00262.png", "entropy": 0.7003693580627441} +{"ts": "2026-01-29T21:31:15.593223Z", "loop": 264, "env_steps": 162201600, "exact_value_avg": 0.3110756278038025, "regret_dist": 0.4927017390727997, "regret_other_env": 0.7611387372016907, "regret_corner": 0.09004624933004379, "regret_row": 0.5869619250297546, "regret_any": 0.7611387372016907, "regret_bot": 0.7900293469429016, "value_dist": 0.3110756278038025, "value_other_env": 0.0684143677353859, "value_corner": 0.6750674843788147, "value_row": 0.20972712337970734, "value_any": 0.0684143677353859, "value_bot": 0.006659746170043945, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00264.png", "entropy": 0.7002117037773132} +{"ts": "2026-01-29T21:31:17.962897Z", "loop": 266, "env_steps": 163430400, "exact_value_avg": 0.3110702931880951, "regret_dist": 0.49270713329315186, "regret_other_env": 0.7611384987831116, "regret_corner": 0.09006001055240631, "regret_row": 0.5857195258140564, "regret_any": 0.7611384987831116, "regret_bot": 0.7901137471199036, "value_dist": 0.3110702931880951, "value_other_env": 0.06841464340686798, "value_corner": 0.6750537157058716, "value_row": 0.2109694927930832, "value_any": 0.06841464340686798, "value_bot": 0.006575244478881359, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00266.png", "entropy": 0.6999965310096741} +{"ts": "2026-01-29T21:31:20.330376Z", "loop": 268, "env_steps": 164659200, "exact_value_avg": 0.3110831379890442, "regret_dist": 0.49269425868988037, "regret_other_env": 0.7611415982246399, "regret_corner": 0.0900232344865799, "regret_row": 0.5865128636360168, "regret_any": 0.7611415982246399, "regret_bot": 0.7900612354278564, "value_dist": 0.3110831379890442, "value_other_env": 0.06841155886650085, "value_corner": 0.675090491771698, "value_row": 0.21017615497112274, "value_any": 0.06841155886650085, "value_bot": 0.0066277687437832355, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00268.png", "entropy": 0.6998156309127808} +{"ts": "2026-01-29T21:31:22.691445Z", "loop": 270, "env_steps": 165888000, "exact_value_avg": 0.3110862374305725, "regret_dist": 0.4926910996437073, "regret_other_env": 0.7611455917358398, "regret_corner": 0.09000936150550842, "regret_row": 0.5873317718505859, "regret_any": 0.7611455917358398, "regret_bot": 0.7900058627128601, "value_dist": 0.3110862374305725, "value_other_env": 0.06840747594833374, "value_corner": 0.6751043200492859, "value_row": 0.20935726165771484, "value_any": 0.06840747594833374, "value_bot": 0.006683246232569218, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00270.png", "entropy": 0.6995744109153748} +{"ts": "2026-01-29T21:31:25.052290Z", "loop": 272, "env_steps": 167116800, "exact_value_avg": 0.31107819080352783, "regret_dist": 0.49269920587539673, "regret_other_env": 0.7611470818519592, "regret_corner": 0.09002738445997238, "regret_row": 0.585002064704895, "regret_any": 0.7611470818519592, "regret_bot": 0.7901662588119507, "value_dist": 0.31107819080352783, "value_other_env": 0.06840605288743973, "value_corner": 0.6750863790512085, "value_row": 0.21168692409992218, "value_any": 0.06840605288743973, "value_bot": 0.006522854790091515, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00272.png", "entropy": 0.6992538571357727} +{"ts": "2026-01-29T21:31:27.414667Z", "loop": 274, "env_steps": 168345600, "exact_value_avg": 0.3110034763813019, "regret_dist": 0.4927738606929779, "regret_other_env": 0.761155903339386, "regret_corner": 0.09020078182220459, "regret_row": 0.5825346112251282, "regret_any": 0.761155903339386, "regret_bot": 0.7903329133987427, "value_dist": 0.3110034763813019, "value_other_env": 0.0683971717953682, "value_corner": 0.6749129295349121, "value_row": 0.2141544669866562, "value_any": 0.0683971717953682, "value_bot": 0.006356183439493179, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00274.png", "entropy": 0.6988111734390259} +{"ts": "2026-01-29T21:31:29.794187Z", "loop": 276, "env_steps": 169574400, "exact_value_avg": 0.31088000535964966, "regret_dist": 0.4928974211215973, "regret_other_env": 0.7611674070358276, "regret_corner": 0.09049239754676819, "regret_row": 0.5803828239440918, "regret_any": 0.7611674070358276, "regret_bot": 0.7904747724533081, "value_dist": 0.31088000535964966, "value_other_env": 0.06838574260473251, "value_corner": 0.6746213436126709, "value_row": 0.21630622446537018, "value_any": 0.06838574260473251, "value_bot": 0.006214245688170195, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00276.png", "entropy": 0.698291540145874} +{"ts": "2026-01-29T21:31:32.165564Z", "loop": 278, "env_steps": 170803200, "exact_value_avg": 0.3108937442302704, "regret_dist": 0.4928836524486542, "regret_other_env": 0.7611716985702515, "regret_corner": 0.09045156836509705, "regret_row": 0.5806169509887695, "regret_any": 0.7611716985702515, "regret_bot": 0.7904601097106934, "value_dist": 0.3108937442302704, "value_other_env": 0.0683814287185669, "value_corner": 0.674662172794342, "value_row": 0.21607202291488647, "value_any": 0.0683814287185669, "value_bot": 0.006228998769074678, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00278.png", "entropy": 0.6982965469360352} +{"ts": "2026-01-29T21:31:34.527928Z", "loop": 280, "env_steps": 172032000, "exact_value_avg": 0.3110533058643341, "regret_dist": 0.49272409081459045, "regret_other_env": 0.761163055896759, "regret_corner": 0.09006557613611221, "regret_row": 0.5836919546127319, "regret_any": 0.761163055896759, "regret_bot": 0.790257453918457, "value_dist": 0.3110533058643341, "value_other_env": 0.06839004904031754, "value_corner": 0.6750481724739075, "value_row": 0.21299712359905243, "value_any": 0.06839004904031754, "value_bot": 0.006431549787521362, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00280.png", "entropy": 0.698846697807312} +{"ts": "2026-01-29T21:31:36.894837Z", "loop": 282, "env_steps": 173260800, "exact_value_avg": 0.3110710382461548, "regret_dist": 0.4927063584327698, "regret_other_env": 0.7611680626869202, "regret_corner": 0.0900137647986412, "regret_row": 0.5894480347633362, "regret_any": 0.7611680626869202, "regret_bot": 0.7898664474487305, "value_dist": 0.3110710382461548, "value_other_env": 0.0683850646018982, "value_corner": 0.6750999689102173, "value_row": 0.2072409838438034, "value_any": 0.0683850646018982, "value_bot": 0.006822500377893448, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00282.png", "entropy": 0.6990195512771606} +{"ts": "2026-01-29T21:31:39.263323Z", "loop": 284, "env_steps": 174489600, "exact_value_avg": 0.31082212924957275, "regret_dist": 0.4929552674293518, "regret_other_env": 0.7611916661262512, "regret_corner": 0.0906006395816803, "regret_row": 0.5941298604011536, "regret_any": 0.7611916661262512, "regret_bot": 0.7895340919494629, "value_dist": 0.31082212924957275, "value_other_env": 0.06836143881082535, "value_corner": 0.6745131015777588, "value_row": 0.2025591880083084, "value_any": 0.06836143881082535, "value_bot": 0.007154899649322033, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00284.png", "entropy": 0.6982830762863159} +{"ts": "2026-01-29T21:31:41.627881Z", "loop": 286, "env_steps": 175718400, "exact_value_avg": 0.3104250133037567, "regret_dist": 0.49335235357284546, "regret_other_env": 0.7612274289131165, "regret_corner": 0.09153970330953598, "regret_row": 0.5982102751731873, "regret_any": 0.7612274289131165, "regret_bot": 0.7892340421676636, "value_dist": 0.3104250133037567, "value_other_env": 0.0683256983757019, "value_corner": 0.6735739707946777, "value_row": 0.1984788328409195, "value_any": 0.0683256983757019, "value_bot": 0.007455052342265844, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00286.png", "entropy": 0.6970426440238953} +{"ts": "2026-01-29T21:31:43.991022Z", "loop": 288, "env_steps": 176947200, "exact_value_avg": 0.31070587038993835, "regret_dist": 0.4930715262889862, "regret_other_env": 0.7612022757530212, "regret_corner": 0.09087533503770828, "regret_row": 0.5955396890640259, "regret_any": 0.7612022757530212, "regret_bot": 0.7894312739372253, "value_dist": 0.31070587038993835, "value_other_env": 0.06835082173347473, "value_corner": 0.674238383769989, "value_row": 0.20114929974079132, "value_any": 0.06835082173347473, "value_bot": 0.007257798220962286, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00288.png", "entropy": 0.6980194449424744} +{"ts": "2026-01-29T21:31:46.355998Z", "loop": 290, "env_steps": 178176000, "exact_value_avg": 0.3110867738723755, "regret_dist": 0.4926905930042267, "regret_other_env": 0.7611624598503113, "regret_corner": 0.08998275548219681, "regret_row": 0.5885677933692932, "regret_any": 0.7611624598503113, "regret_bot": 0.7899260520935059, "value_dist": 0.3110867738723755, "value_other_env": 0.0683906227350235, "value_corner": 0.6751310229301453, "value_row": 0.20812126994132996, "value_any": 0.0683906227350235, "value_bot": 0.006762981880456209, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00290.png", "entropy": 0.6992409825325012} +{"ts": "2026-01-29T21:31:48.714629Z", "loop": 292, "env_steps": 179404800, "exact_value_avg": 0.31092461943626404, "regret_dist": 0.4928527772426605, "regret_other_env": 0.7611666917800903, "regret_corner": 0.09038188308477402, "regret_row": 0.5811353325843811, "regret_any": 0.7611666917800903, "regret_bot": 0.7904272675514221, "value_dist": 0.31092461943626404, "value_other_env": 0.06838642805814743, "value_corner": 0.6747318506240845, "value_row": 0.21555368602275848, "value_any": 0.06838642805814743, "value_bot": 0.006261791568249464, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00292.png", "entropy": 0.6985171437263489} +{"ts": "2026-01-29T21:31:51.076547Z", "loop": 294, "env_steps": 180633600, "exact_value_avg": 0.31047749519348145, "regret_dist": 0.4932999014854431, "regret_other_env": 0.7611972689628601, "regret_corner": 0.09145376086235046, "regret_row": 0.5760524272918701, "regret_any": 0.7611972689628601, "regret_bot": 0.7907557487487793, "value_dist": 0.31047749519348145, "value_other_env": 0.06835586577653885, "value_corner": 0.6736599206924438, "value_row": 0.22063665091991425, "value_any": 0.06835586577653885, "value_bot": 0.005933346692472696, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00294.png", "entropy": 0.6968591809272766} +{"ts": "2026-01-29T21:31:53.438388Z", "loop": 296, "env_steps": 181862400, "exact_value_avg": 0.31020134687423706, "regret_dist": 0.4935760200023651, "regret_other_env": 0.7612181305885315, "regret_corner": 0.09211282432079315, "regret_row": 0.5739287734031677, "regret_any": 0.7612181305885315, "regret_bot": 0.790890634059906, "value_dist": 0.31020134687423706, "value_other_env": 0.06833498179912567, "value_corner": 0.6730008721351624, "value_row": 0.22276027500629425, "value_any": 0.06833498179912567, "value_bot": 0.005798389669507742, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00296.png", "entropy": 0.6958884596824646} +{"ts": "2026-01-29T21:31:55.799584Z", "loop": 298, "env_steps": 183091200, "exact_value_avg": 0.31059759855270386, "regret_dist": 0.4931797981262207, "regret_other_env": 0.7611886858940125, "regret_corner": 0.0911664217710495, "regret_row": 0.5771807432174683, "regret_any": 0.7611886858940125, "regret_bot": 0.7906843423843384, "value_dist": 0.31059759855270386, "value_other_env": 0.06836444139480591, "value_corner": 0.6739473342895508, "value_row": 0.2195083051919937, "value_any": 0.06836444139480591, "value_bot": 0.00600470183417201, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00298.png", "entropy": 0.6973983645439148} +{"ts": "2026-01-29T21:31:58.166776Z", "loop": 300, "env_steps": 184320000, "exact_value_avg": 0.31088122725486755, "regret_dist": 0.49289608001708984, "regret_other_env": 0.7611702084541321, "regret_corner": 0.0904848501086235, "regret_row": 0.5804325938224792, "regret_any": 0.7611702084541321, "regret_bot": 0.7904729247093201, "value_dist": 0.31088122725486755, "value_other_env": 0.06838282942771912, "value_corner": 0.6746288537979126, "value_row": 0.21625646948814392, "value_any": 0.06838282942771912, "value_bot": 0.00621608505025506, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00300.png", "entropy": 0.698466956615448} +{"ts": "2026-01-29T21:32:00.537919Z", "loop": 302, "env_steps": 185548800, "exact_value_avg": 0.3110977113246918, "regret_dist": 0.4926796555519104, "regret_other_env": 0.7611570358276367, "regret_corner": 0.08996350318193436, "regret_row": 0.5862244367599487, "regret_any": 0.7611570358276367, "regret_bot": 0.7900859117507935, "value_dist": 0.3110977113246918, "value_other_env": 0.06839597970247269, "value_corner": 0.6751502752304077, "value_row": 0.21046461164951324, "value_any": 0.06839597970247269, "value_bot": 0.006603101268410683, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00302.png", "entropy": 0.6994071006774902} +{"ts": "2026-01-29T21:32:02.901699Z", "loop": 304, "env_steps": 186777600, "exact_value_avg": 0.3109879195690155, "regret_dist": 0.49278947710990906, "regret_other_env": 0.7611701488494873, "regret_corner": 0.0902184247970581, "regret_row": 0.5915204882621765, "regret_any": 0.7611701488494873, "regret_bot": 0.7897181510925293, "value_dist": 0.3109879195690155, "value_other_env": 0.06838291883468628, "value_corner": 0.6748954057693481, "value_row": 0.20516856014728546, "value_any": 0.06838291883468628, "value_bot": 0.006970890332013369, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00304.png", "entropy": 0.6991634964942932} +{"ts": "2026-01-29T21:32:05.269395Z", "loop": 306, "env_steps": 188006400, "exact_value_avg": 0.3107392191886902, "regret_dist": 0.4930381774902344, "regret_other_env": 0.761194109916687, "regret_corner": 0.09080421924591064, "regret_row": 0.5951521992683411, "regret_any": 0.761194109916687, "regret_bot": 0.7894564270973206, "value_dist": 0.3107392191886902, "value_other_env": 0.06835895776748657, "value_corner": 0.6743095517158508, "value_row": 0.2015368491411209, "value_any": 0.06835895776748657, "value_bot": 0.007232608739286661, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00306.png", "entropy": 0.6984403729438782} +{"ts": "2026-01-29T21:32:07.633372Z", "loop": 308, "env_steps": 189235200, "exact_value_avg": 0.3105965852737427, "regret_dist": 0.4931808412075043, "regret_other_env": 0.7612085938453674, "regret_corner": 0.09113917499780655, "regret_row": 0.5966700315475464, "regret_any": 0.7612085938453674, "regret_bot": 0.7893449068069458, "value_dist": 0.3105965852737427, "value_other_env": 0.06834457814693451, "value_corner": 0.6739745736122131, "value_row": 0.2000190019607544, "value_any": 0.06834457814693451, "value_bot": 0.007344161160290241, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00308.png", "entropy": 0.6979557871818542} +{"ts": "2026-01-29T21:32:09.995290Z", "loop": 310, "env_steps": 190464000, "exact_value_avg": 0.31029799580574036, "regret_dist": 0.4934794008731842, "regret_other_env": 0.7612377405166626, "regret_corner": 0.09184183180332184, "regret_row": 0.5992461442947388, "regret_any": 0.7612377405166626, "regret_bot": 0.7891529202461243, "value_dist": 0.31029799580574036, "value_other_env": 0.06831536442041397, "value_corner": 0.673271894454956, "value_row": 0.19744287431240082, "value_any": 0.06831536442041397, "value_bot": 0.007536186370998621, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00310.png", "entropy": 0.696871280670166} +{"ts": "2026-01-29T21:32:12.359475Z", "loop": 312, "env_steps": 191692800, "exact_value_avg": 0.3104417026042938, "regret_dist": 0.49333566427230835, "regret_other_env": 0.7612295150756836, "regret_corner": 0.0914948582649231, "regret_row": 0.5981468558311462, "regret_any": 0.7612295150756836, "regret_bot": 0.7892361283302307, "value_dist": 0.3104417026042938, "value_other_env": 0.06832359731197357, "value_corner": 0.6736188530921936, "value_row": 0.19854220747947693, "value_any": 0.06832359731197357, "value_bot": 0.007452936377376318, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00312.png", "entropy": 0.697199821472168} +{"ts": "2026-01-29T21:32:14.723768Z", "loop": 314, "env_steps": 192921600, "exact_value_avg": 0.31096184253692627, "regret_dist": 0.4928155541419983, "regret_other_env": 0.7611861824989319, "regret_corner": 0.09025957435369492, "regret_row": 0.5921863317489624, "regret_any": 0.7611861824989319, "regret_bot": 0.7896727323532104, "value_dist": 0.31096184253692627, "value_other_env": 0.06836695969104767, "value_corner": 0.6748541593551636, "value_row": 0.204502671957016, "value_any": 0.06836695969104767, "value_bot": 0.007016309071332216, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00314.png", "entropy": 0.6986784338951111} +{"ts": "2026-01-29T21:32:17.092494Z", "loop": 316, "env_steps": 194150400, "exact_value_avg": 0.3111073970794678, "regret_dist": 0.4926700294017792, "regret_other_env": 0.7611714601516724, "regret_corner": 0.08991783857345581, "regret_row": 0.5852473378181458, "regret_any": 0.7611714601516724, "regret_bot": 0.7901546359062195, "value_dist": 0.3111073970794678, "value_other_env": 0.06838170439004898, "value_corner": 0.6751958727836609, "value_row": 0.21144171059131622, "value_any": 0.06838170439004898, "value_bot": 0.0065343924798071384, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00316.png", "entropy": 0.6987730860710144} +{"ts": "2026-01-29T21:32:19.457364Z", "loop": 318, "env_steps": 195379200, "exact_value_avg": 0.3108115494251251, "regret_dist": 0.49296584725379944, "regret_other_env": 0.7611942291259766, "regret_corner": 0.09062317758798599, "regret_row": 0.5791851878166199, "regret_any": 0.7611942291259766, "regret_bot": 0.7905575633049011, "value_dist": 0.3108115494251251, "value_other_env": 0.06835886090993881, "value_corner": 0.6744905710220337, "value_row": 0.2175038605928421, "value_any": 0.06835886090993881, "value_bot": 0.00613147160038352, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00318.png", "entropy": 0.6973797678947449} +{"ts": "2026-01-29T21:32:21.831400Z", "loop": 320, "env_steps": 196608000, "exact_value_avg": 0.3104967772960663, "regret_dist": 0.4932805895805359, "regret_other_env": 0.7612192034721375, "regret_corner": 0.09137268364429474, "regret_row": 0.5760562419891357, "regret_any": 0.7612192034721375, "regret_bot": 0.7907590866088867, "value_dist": 0.3104967772960663, "value_other_env": 0.0683339461684227, "value_corner": 0.6737410426139832, "value_row": 0.22063280642032623, "value_any": 0.0683339461684227, "value_bot": 0.005929944105446339, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00320.png", "entropy": 0.6961113810539246} +{"ts": "2026-01-29T21:32:24.194047Z", "loop": 322, "env_steps": 197836800, "exact_value_avg": 0.3109387755393982, "regret_dist": 0.492838591337204, "regret_other_env": 0.7611888647079468, "regret_corner": 0.09031309187412262, "regret_row": 0.5809139013290405, "regret_any": 0.7611888647079468, "regret_bot": 0.790445864200592, "value_dist": 0.3109387755393982, "value_other_env": 0.0683642029762268, "value_corner": 0.6748006343841553, "value_row": 0.21577517688274384, "value_any": 0.0683642029762268, "value_bot": 0.0062432000413537025, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00322.png", "entropy": 0.6977081894874573} +{"ts": "2026-01-29T21:32:26.563685Z", "loop": 324, "env_steps": 199065600, "exact_value_avg": 0.311119019985199, "regret_dist": 0.4926583468914032, "regret_other_env": 0.7611806988716125, "regret_corner": 0.08987478166818619, "regret_row": 0.5883103013038635, "regret_any": 0.7611806988716125, "regret_bot": 0.7899489402770996, "value_dist": 0.311119019985199, "value_other_env": 0.06837240606546402, "value_corner": 0.6752389669418335, "value_row": 0.20837876200675964, "value_any": 0.06837240606546402, "value_bot": 0.00674009881913662, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00324.png", "entropy": 0.6985104084014893} +{"ts": "2026-01-29T21:32:28.929108Z", "loop": 326, "env_steps": 200294400, "exact_value_avg": 0.3109239637851715, "regret_dist": 0.49285343289375305, "regret_other_env": 0.7612010836601257, "regret_corner": 0.09033188223838806, "regret_row": 0.5930714011192322, "regret_any": 0.7612010836601257, "regret_bot": 0.7896149158477783, "value_dist": 0.3109239637851715, "value_other_env": 0.06835200637578964, "value_corner": 0.674781858921051, "value_row": 0.2036176174879074, "value_any": 0.06835200637578964, "value_bot": 0.007074197754263878, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00326.png", "entropy": 0.6979390382766724} +{"ts": "2026-01-29T21:32:31.298971Z", "loop": 328, "env_steps": 201523200, "exact_value_avg": 0.31085509061813354, "regret_dist": 0.4929223358631134, "regret_other_env": 0.7612107396125793, "regret_corner": 0.0904897004365921, "regret_row": 0.5941191911697388, "regret_any": 0.7612107396125793, "regret_bot": 0.7895389199256897, "value_dist": 0.31085509061813354, "value_other_env": 0.06834243983030319, "value_corner": 0.6746240258216858, "value_row": 0.2025698572397232, "value_any": 0.06834243983030319, "value_bot": 0.007150211837142706, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00328.png", "entropy": 0.6976834535598755} +{"ts": "2026-01-29T21:32:33.674895Z", "loop": 330, "env_steps": 202752000, "exact_value_avg": 0.31089991331100464, "regret_dist": 0.4928774833679199, "regret_other_env": 0.7612063884735107, "regret_corner": 0.09038407355546951, "regret_row": 0.5935487747192383, "regret_any": 0.7612063884735107, "regret_bot": 0.7895801663398743, "value_dist": 0.31089991331100464, "value_other_env": 0.06834669411182404, "value_corner": 0.6747297048568726, "value_row": 0.20314030349254608, "value_any": 0.06834669411182404, "value_bot": 0.007108887657523155, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00330.png", "entropy": 0.6978038549423218} +{"ts": "2026-01-29T21:32:36.044645Z", "loop": 332, "env_steps": 203980800, "exact_value_avg": 0.31108152866363525, "regret_dist": 0.4926958680152893, "regret_other_env": 0.7611892223358154, "regret_corner": 0.08995576202869415, "regret_row": 0.5900035500526428, "regret_any": 0.7611892223358154, "regret_bot": 0.7898313403129578, "value_dist": 0.31108152866363525, "value_other_env": 0.06836389750242233, "value_corner": 0.6751579642295837, "value_row": 0.20668542385101318, "value_any": 0.06836389750242233, "value_bot": 0.006857766304165125, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00332.png", "entropy": 0.6983187794685364} +{"ts": "2026-01-29T21:32:38.404918Z", "loop": 334, "env_steps": 205209600, "exact_value_avg": 0.3111058175563812, "regret_dist": 0.49267154932022095, "regret_other_env": 0.7611809968948364, "regret_corner": 0.08990732580423355, "regret_row": 0.5843791365623474, "regret_any": 0.7611809968948364, "regret_bot": 0.7902163863182068, "value_dist": 0.3111058175563812, "value_other_env": 0.06837210804224014, "value_corner": 0.6752064228057861, "value_row": 0.21230991184711456, "value_any": 0.06837210804224014, "value_bot": 0.006472663022577763, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00334.png", "entropy": 0.6982447504997253} +{"ts": "2026-01-29T21:32:40.770803Z", "loop": 336, "env_steps": 206438400, "exact_value_avg": 0.31086838245391846, "regret_dist": 0.4929090142250061, "regret_other_env": 0.7611952424049377, "regret_corner": 0.09047964960336685, "regret_row": 0.5797527432441711, "regret_any": 0.7611952424049377, "regret_bot": 0.7905230522155762, "value_dist": 0.31086838245391846, "value_other_env": 0.06835786253213882, "value_corner": 0.6746340990066528, "value_row": 0.21693626046180725, "value_any": 0.06835786253213882, "value_bot": 0.006165946368128061, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00336.png", "entropy": 0.6973106861114502} +{"ts": "2026-01-29T21:32:43.136767Z", "loop": 338, "env_steps": 207667200, "exact_value_avg": 0.3107219636440277, "regret_dist": 0.49305543303489685, "regret_other_env": 0.7612050771713257, "regret_corner": 0.09083095192909241, "regret_row": 0.578060507774353, "regret_any": 0.7612050771713257, "regret_bot": 0.7906309962272644, "value_dist": 0.3107219636440277, "value_other_env": 0.06834804266691208, "value_corner": 0.6742827892303467, "value_row": 0.21862857043743134, "value_any": 0.06834804266691208, "value_bot": 0.006058048456907272, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00338.png", "entropy": 0.6968336701393127} +{"ts": "2026-01-29T21:32:45.497781Z", "loop": 340, "env_steps": 208896000, "exact_value_avg": 0.3110041618347168, "regret_dist": 0.492773175239563, "regret_other_env": 0.7611833214759827, "regret_corner": 0.0901578739285469, "regret_row": 0.5818696618080139, "regret_any": 0.7611833214759827, "regret_bot": 0.7903832197189331, "value_dist": 0.3110041618347168, "value_other_env": 0.0683697760105133, "value_corner": 0.6749557852745056, "value_row": 0.21481940150260925, "value_any": 0.0683697760105133, "value_bot": 0.006305747665464878, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00340.png", "entropy": 0.6979807019233704} +{"ts": "2026-01-29T21:32:47.862184Z", "loop": 342, "env_steps": 210124800, "exact_value_avg": 0.3111284375190735, "regret_dist": 0.4926488995552063, "regret_other_env": 0.7611762881278992, "regret_corner": 0.08985782414674759, "regret_row": 0.5877179503440857, "regret_any": 0.7611762881278992, "regret_bot": 0.7899906039237976, "value_dist": 0.3111284375190735, "value_other_env": 0.06837683171033859, "value_corner": 0.6752558946609497, "value_row": 0.20897109806537628, "value_any": 0.06837683171033859, "value_bot": 0.0066983927972614765, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00342.png", "entropy": 0.6986364722251892} +{"ts": "2026-01-29T21:32:50.230303Z", "loop": 344, "env_steps": 211353600, "exact_value_avg": 0.3110505938529968, "regret_dist": 0.4927268326282501, "regret_other_env": 0.7611839771270752, "regret_corner": 0.09004110097885132, "regret_row": 0.5908191204071045, "regret_any": 0.7611839771270752, "regret_bot": 0.7897760272026062, "value_dist": 0.3110505938529968, "value_other_env": 0.06836919486522675, "value_corner": 0.6750726699829102, "value_row": 0.20586998760700226, "value_any": 0.06836919486522675, "value_bot": 0.006913111079484224, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00344.png", "entropy": 0.6984601020812988} +{"ts": "2026-01-29T21:32:52.591363Z", "loop": 346, "env_steps": 212582400, "exact_value_avg": 0.3110106587409973, "regret_dist": 0.49276676774024963, "regret_other_env": 0.7611909508705139, "regret_corner": 0.09013041108846664, "regret_row": 0.5917003154754639, "regret_any": 0.7611909508705139, "regret_bot": 0.7897131443023682, "value_dist": 0.3110106587409973, "value_other_env": 0.06836214661598206, "value_corner": 0.6749833822250366, "value_row": 0.20498880743980408, "value_any": 0.06836214661598206, "value_bot": 0.006975943222641945, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00346.png", "entropy": 0.6983620524406433} +{"ts": "2026-01-29T21:32:54.957056Z", "loop": 348, "env_steps": 213811200, "exact_value_avg": 0.31106334924697876, "regret_dist": 0.4927140474319458, "regret_other_env": 0.7611887454986572, "regret_corner": 0.09000199288129807, "regret_row": 0.5906669497489929, "regret_any": 0.7611887454986572, "regret_bot": 0.7897858619689941, "value_dist": 0.31106334924697876, "value_other_env": 0.06836437433958054, "value_corner": 0.6751117706298828, "value_row": 0.20602209866046906, "value_any": 0.06836437433958054, "value_bot": 0.006903169211000204, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00348.png", "entropy": 0.6984041929244995} +{"ts": "2026-01-29T21:32:57.318303Z", "loop": 350, "env_steps": 215040000, "exact_value_avg": 0.3111288249492645, "regret_dist": 0.49264851212501526, "regret_other_env": 0.7611847519874573, "regret_corner": 0.08984408527612686, "regret_row": 0.5885877013206482, "regret_any": 0.7611847519874573, "regret_bot": 0.7899314761161804, "value_dist": 0.3111288249492645, "value_other_env": 0.0683683305978775, "value_corner": 0.675269603729248, "value_row": 0.2081013023853302, "value_any": 0.0683683305978775, "value_bot": 0.0067575909197330475, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00350.png", "entropy": 0.6984243392944336} +{"ts": "2026-01-29T21:32:59.681013Z", "loop": 352, "env_steps": 216268800, "exact_value_avg": 0.3111453354358673, "regret_dist": 0.49263209104537964, "regret_other_env": 0.7611871957778931, "regret_corner": 0.0897994190454483, "regret_row": 0.5866342782974243, "regret_any": 0.7611871957778931, "regret_bot": 0.7900662422180176, "value_dist": 0.3111453354358673, "value_other_env": 0.06836597621440887, "value_corner": 0.6753143668174744, "value_row": 0.21005472540855408, "value_any": 0.06836597621440887, "value_bot": 0.006622875574976206, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00352.png", "entropy": 0.6982880234718323} +{"ts": "2026-01-29T21:33:02.053701Z", "loop": 354, "env_steps": 217497600, "exact_value_avg": 0.3110654354095459, "regret_dist": 0.4927119314670563, "regret_other_env": 0.761191189289093, "regret_corner": 0.08999304473400116, "regret_row": 0.5829448103904724, "regret_any": 0.761191189289093, "regret_bot": 0.7903149724006653, "value_dist": 0.3110654354095459, "value_other_env": 0.06836190074682236, "value_corner": 0.6751207113265991, "value_row": 0.21374423801898956, "value_any": 0.06836190074682236, "value_bot": 0.006374116986989975, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00354.png", "entropy": 0.6978251934051514} +{"ts": "2026-01-29T21:33:04.431665Z", "loop": 356, "env_steps": 218726400, "exact_value_avg": 0.31095564365386963, "regret_dist": 0.49282175302505493, "regret_other_env": 0.7611987590789795, "regret_corner": 0.0902562215924263, "regret_row": 0.5808348655700684, "regret_any": 0.7611987590789795, "regret_bot": 0.7904552817344666, "value_dist": 0.31095564365386963, "value_other_env": 0.06835439056158066, "value_corner": 0.674857497215271, "value_row": 0.21585415303707123, "value_any": 0.06835439056158066, "value_bot": 0.0062337396666407585, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00356.png", "entropy": 0.6973291635513306} +{"ts": "2026-01-29T21:33:06.803697Z", "loop": 358, "env_steps": 219955200, "exact_value_avg": 0.3109707534313202, "regret_dist": 0.49280664324760437, "regret_other_env": 0.7611995339393616, "regret_corner": 0.09021726250648499, "regret_row": 0.5810062289237976, "regret_any": 0.7611995339393616, "regret_bot": 0.7904446721076965, "value_dist": 0.3109707534313202, "value_other_env": 0.0683535560965538, "value_corner": 0.6748965382575989, "value_row": 0.21568287909030914, "value_any": 0.0683535560965538, "value_bot": 0.00624443031847477, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00358.png", "entropy": 0.6972758769989014} +{"ts": "2026-01-29T21:33:09.167160Z", "loop": 360, "env_steps": 221184000, "exact_value_avg": 0.3110537827014923, "regret_dist": 0.49272361397743225, "regret_other_env": 0.761197030544281, "regret_corner": 0.09001344442367554, "regret_row": 0.5824898481369019, "regret_any": 0.761197030544281, "regret_bot": 0.7903470993041992, "value_dist": 0.3110537827014923, "value_other_env": 0.06835610419511795, "value_corner": 0.6751003265380859, "value_row": 0.2141992151737213, "value_any": 0.06835610419511795, "value_bot": 0.00634197099134326, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00360.png", "entropy": 0.6975279450416565} +{"ts": "2026-01-29T21:33:11.525476Z", "loop": 362, "env_steps": 222412800, "exact_value_avg": 0.31115901470184326, "regret_dist": 0.4926183521747589, "regret_other_env": 0.761193573474884, "regret_corner": 0.08975552022457123, "regret_row": 0.5867087244987488, "regret_any": 0.761193573474884, "regret_bot": 0.7900633811950684, "value_dist": 0.31115901470184326, "value_other_env": 0.06835950911045074, "value_corner": 0.675358235836029, "value_row": 0.20998027920722961, "value_any": 0.06835950911045074, "value_bot": 0.006625685840845108, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00362.png", "entropy": 0.6979615092277527} +{"ts": "2026-01-29T21:33:13.896921Z", "loop": 364, "env_steps": 223641600, "exact_value_avg": 0.31113314628601074, "regret_dist": 0.4926442503929138, "regret_other_env": 0.7611986994743347, "regret_corner": 0.0898125171661377, "regret_row": 0.5889249444007874, "regret_any": 0.7611986994743347, "regret_bot": 0.789911150932312, "value_dist": 0.31113314628601074, "value_other_env": 0.06835442781448364, "value_corner": 0.6753012537956238, "value_row": 0.20776407420635223, "value_any": 0.06835442781448364, "value_bot": 0.006777977105230093, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00364.png", "entropy": 0.6979548931121826} +{"ts": "2026-01-29T21:33:16.271367Z", "loop": 366, "env_steps": 224870400, "exact_value_avg": 0.31114476919174194, "regret_dist": 0.492632657289505, "regret_other_env": 0.7611966133117676, "regret_corner": 0.08978662639856339, "regret_row": 0.5884993672370911, "regret_any": 0.7611966133117676, "regret_bot": 0.7899402976036072, "value_dist": 0.31114476919174194, "value_other_env": 0.06835655868053436, "value_corner": 0.6753270626068115, "value_row": 0.20818963646888733, "value_any": 0.06835655868053436, "value_bot": 0.006748747546225786, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00366.png", "entropy": 0.6979824900627136} +{"ts": "2026-01-29T21:33:18.639763Z", "loop": 368, "env_steps": 226099200, "exact_value_avg": 0.31116151809692383, "regret_dist": 0.49261587858200073, "regret_other_env": 0.7611932158470154, "regret_corner": 0.08974983543157578, "regret_row": 0.5866121053695679, "regret_any": 0.7611932158470154, "regret_bot": 0.790069580078125, "value_dist": 0.31116151809692383, "value_other_env": 0.06835989654064178, "value_corner": 0.6753639578819275, "value_row": 0.2100769430398941, "value_any": 0.06835989654064178, "value_bot": 0.006619477644562721, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00368.png", "entropy": 0.6979666352272034} +{"ts": "2026-01-29T21:33:21.007581Z", "loop": 370, "env_steps": 227328000, "exact_value_avg": 0.31113484501838684, "regret_dist": 0.49264249205589294, "regret_other_env": 0.7611920237541199, "regret_corner": 0.08981819450855255, "regret_row": 0.5847133994102478, "regret_any": 0.7611920237541199, "regret_bot": 0.7901995778083801, "value_dist": 0.31113484501838684, "value_other_env": 0.06836105138063431, "value_corner": 0.6752955317497253, "value_row": 0.21197564899921417, "value_any": 0.06836105138063431, "value_bot": 0.006489494815468788, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00370.png", "entropy": 0.697847306728363} +{"ts": "2026-01-29T21:33:23.371568Z", "loop": 372, "env_steps": 228556800, "exact_value_avg": 0.3111165165901184, "regret_dist": 0.4926609396934509, "regret_other_env": 0.7611921429634094, "regret_corner": 0.08986402302980423, "regret_row": 0.5839288830757141, "regret_any": 0.7611921429634094, "regret_bot": 0.7902512550354004, "value_dist": 0.3111165165901184, "value_other_env": 0.06836102157831192, "value_corner": 0.6752497553825378, "value_row": 0.21276019513607025, "value_any": 0.06836102157831192, "value_bot": 0.006437762174755335, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00372.png", "entropy": 0.6977663040161133} +{"ts": "2026-01-29T21:33:25.742063Z", "loop": 374, "env_steps": 229785600, "exact_value_avg": 0.31115055084228516, "regret_dist": 0.4926268458366394, "regret_other_env": 0.7611922025680542, "regret_corner": 0.08977875858545303, "regret_row": 0.5853071212768555, "regret_any": 0.7611922025680542, "regret_bot": 0.7901585102081299, "value_dist": 0.31115055084228516, "value_other_env": 0.06836087256669998, "value_corner": 0.6753350496292114, "value_row": 0.21138198673725128, "value_any": 0.06836087256669998, "value_bot": 0.006530552636831999, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00374.png", "entropy": 0.6978594064712524} +{"ts": "2026-01-29T21:33:28.108448Z", "loop": 376, "env_steps": 231014400, "exact_value_avg": 0.3111482560634613, "regret_dist": 0.49262911081314087, "regret_other_env": 0.7611905336380005, "regret_corner": 0.08978696912527084, "regret_row": 0.5851783156394958, "regret_any": 0.7611905336380005, "regret_bot": 0.7901665568351746, "value_dist": 0.3111482560634613, "value_other_env": 0.06836255639791489, "value_corner": 0.6753267645835876, "value_row": 0.21151073276996613, "value_any": 0.06836255639791489, "value_bot": 0.0065224370919167995, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00376.png", "entropy": 0.6978914141654968} +{"ts": "2026-01-29T21:33:30.471410Z", "loop": 378, "env_steps": 232243200, "exact_value_avg": 0.31116387248039246, "regret_dist": 0.4926135241985321, "regret_other_env": 0.7611890435218811, "regret_corner": 0.08975023031234741, "regret_row": 0.586762547492981, "regret_any": 0.7611890435218811, "regret_bot": 0.7900593876838684, "value_dist": 0.31116387248039246, "value_other_env": 0.06836409121751785, "value_corner": 0.6753635406494141, "value_row": 0.20992645621299744, "value_any": 0.06836409121751785, "value_bot": 0.006629626266658306, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00378.png", "entropy": 0.6980254054069519} +{"ts": "2026-01-29T21:33:32.836055Z", "loop": 380, "env_steps": 233472000, "exact_value_avg": 0.3111454248428345, "regret_dist": 0.4926320016384125, "regret_other_env": 0.7611923217773438, "regret_corner": 0.08979151397943497, "regret_row": 0.5887103080749512, "regret_any": 0.7611923217773438, "regret_bot": 0.7899274826049805, "value_dist": 0.3111454248428345, "value_other_env": 0.06836085021495819, "value_corner": 0.6753222346305847, "value_row": 0.2079787701368332, "value_any": 0.06836085021495819, "value_bot": 0.006761536933481693, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00380.png", "entropy": 0.6980058550834656} +{"ts": "2026-01-29T21:33:35.211469Z", "loop": 382, "env_steps": 234700800, "exact_value_avg": 0.31111180782318115, "regret_dist": 0.4926655888557434, "regret_other_env": 0.7611951231956482, "regret_corner": 0.08987125009298325, "regret_row": 0.5900201797485352, "regret_any": 0.7611951231956482, "regret_bot": 0.7898363471031189, "value_dist": 0.31111180782318115, "value_other_env": 0.06835804134607315, "value_corner": 0.6752424836158752, "value_row": 0.2066689133644104, "value_any": 0.06835804134607315, "value_bot": 0.006852677091956139, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00382.png", "entropy": 0.6979884505271912} +{"ts": "2026-01-29T21:33:37.582885Z", "loop": 384, "env_steps": 235929600, "exact_value_avg": 0.31104135513305664, "regret_dist": 0.4927360713481903, "regret_other_env": 0.7612034678459167, "regret_corner": 0.09003488719463348, "regret_row": 0.5916107892990112, "regret_any": 0.7612034678459167, "regret_bot": 0.7897235751152039, "value_dist": 0.31104135513305664, "value_other_env": 0.0683496817946434, "value_corner": 0.6750788688659668, "value_row": 0.20507825911045074, "value_any": 0.0683496817946434, "value_bot": 0.006965454202145338, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00384.png", "entropy": 0.6978153586387634} +{"ts": "2026-01-29T21:33:39.952412Z", "loop": 386, "env_steps": 237158400, "exact_value_avg": 0.3109548091888428, "regret_dist": 0.4928225576877594, "regret_other_env": 0.7612128853797913, "regret_corner": 0.09023706614971161, "regret_row": 0.5931643843650818, "regret_any": 0.7612128853797913, "regret_bot": 0.7896127104759216, "value_dist": 0.3109548091888428, "value_other_env": 0.06834021955728531, "value_corner": 0.6748766899108887, "value_row": 0.2035246193408966, "value_any": 0.06834021955728531, "value_bot": 0.007076346781104803, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00386.png", "entropy": 0.697623074054718} +{"ts": "2026-01-29T21:33:42.316682Z", "loop": 388, "env_steps": 238387200, "exact_value_avg": 0.31105202436447144, "regret_dist": 0.4927254319190979, "regret_other_env": 0.7612025737762451, "regret_corner": 0.09000962227582932, "regret_row": 0.5915302634239197, "regret_any": 0.7612025737762451, "regret_bot": 0.7897287011146545, "value_dist": 0.31105202436447144, "value_other_env": 0.06835056096315384, "value_corner": 0.6751042008399963, "value_row": 0.2051587998867035, "value_any": 0.06835056096315384, "value_bot": 0.006960428785532713, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00388.png", "entropy": 0.6979417204856873} +{"ts": "2026-01-29T21:33:44.689801Z", "loop": 390, "env_steps": 239616000, "exact_value_avg": 0.31112366914749146, "regret_dist": 0.4926537275314331, "regret_other_env": 0.7611942291259766, "regret_corner": 0.08984289318323135, "regret_row": 0.5895562171936035, "regret_any": 0.7611942291259766, "regret_bot": 0.7898672223091125, "value_dist": 0.31112366914749146, "value_other_env": 0.0683588907122612, "value_corner": 0.6752708554267883, "value_row": 0.20713287591934204, "value_any": 0.0683588907122612, "value_bot": 0.006821843329817057, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00390.png", "entropy": 0.6981558799743652} +{"ts": "2026-01-29T21:33:47.049235Z", "loop": 392, "env_steps": 240844800, "exact_value_avg": 0.31116393208503723, "regret_dist": 0.49261340498924255, "regret_other_env": 0.7611866593360901, "regret_corner": 0.08975352346897125, "regret_row": 0.5865269303321838, "regret_any": 0.7611866593360901, "regret_bot": 0.7900748252868652, "value_dist": 0.31116393208503723, "value_other_env": 0.06836641579866409, "value_corner": 0.6753602027893066, "value_row": 0.21016213297843933, "value_any": 0.06836641579866409, "value_bot": 0.006614250130951405, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00392.png", "entropy": 0.6982975006103516} +{"ts": "2026-01-29T21:33:49.415027Z", "loop": 394, "env_steps": 242073600, "exact_value_avg": 0.31110960245132446, "regret_dist": 0.4926677644252777, "regret_other_env": 0.7611851692199707, "regret_corner": 0.08989164978265762, "regret_row": 0.5837421417236328, "regret_any": 0.7611851692199707, "regret_bot": 0.790262758731842, "value_dist": 0.31110960245132446, "value_other_env": 0.06836798787117004, "value_corner": 0.6752220392227173, "value_row": 0.21294693648815155, "value_any": 0.06836798787117004, "value_bot": 0.00642631808295846, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00394.png", "entropy": 0.698112964630127} +{"ts": "2026-01-29T21:33:51.781675Z", "loop": 396, "env_steps": 243302400, "exact_value_avg": 0.31096550822257996, "regret_dist": 0.4928118586540222, "regret_other_env": 0.7611957788467407, "regret_corner": 0.09023590385913849, "regret_row": 0.580780029296875, "regret_any": 0.7611957788467407, "regret_bot": 0.7904590964317322, "value_dist": 0.31096550822257996, "value_other_env": 0.06835728138685226, "value_corner": 0.6748778223991394, "value_row": 0.21590903401374817, "value_any": 0.06835728138685226, "value_bot": 0.00623004324734211, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00396.png", "entropy": 0.6974971294403076} +{"ts": "2026-01-29T21:33:54.142145Z", "loop": 398, "env_steps": 244531200, "exact_value_avg": 0.31094270944595337, "regret_dist": 0.4928346574306488, "regret_other_env": 0.7611992955207825, "regret_corner": 0.09028765559196472, "regret_row": 0.5804789066314697, "regret_any": 0.7611992955207825, "regret_bot": 0.7904784679412842, "value_dist": 0.31094270944595337, "value_other_env": 0.06835376471281052, "value_corner": 0.6748260855674744, "value_row": 0.21621012687683105, "value_any": 0.06835376471281052, "value_bot": 0.006210543680936098, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00398.png", "entropy": 0.6974253058433533} +{"ts": "2026-01-29T21:33:56.500988Z", "loop": 400, "env_steps": 245760000, "exact_value_avg": 0.3110029697418213, "regret_dist": 0.49277448654174805, "regret_other_env": 0.7611948251724243, "regret_corner": 0.09014387428760529, "regret_row": 0.581368088722229, "regret_any": 0.7611948251724243, "regret_bot": 0.7904200553894043, "value_dist": 0.3110029697418213, "value_other_env": 0.06835830211639404, "value_corner": 0.6749699115753174, "value_row": 0.21532101929187775, "value_any": 0.06835830211639404, "value_bot": 0.006269053090363741, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00400.png", "entropy": 0.6976034045219421} +{"ts": "2026-01-29T21:33:58.870066Z", "loop": 402, "env_steps": 246988800, "exact_value_avg": 0.31105247139930725, "regret_dist": 0.4927248954772949, "regret_other_env": 0.7611917853355408, "regret_corner": 0.09002453833818436, "regret_row": 0.5822027921676636, "regret_any": 0.7611917853355408, "regret_bot": 0.7903650999069214, "value_dist": 0.31105247139930725, "value_other_env": 0.0683613121509552, "value_corner": 0.6750891804695129, "value_row": 0.2144862711429596, "value_any": 0.0683613121509552, "value_bot": 0.006323943380266428, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00402.png", "entropy": 0.6976491212844849} +{"ts": "2026-01-29T21:34:01.231147Z", "loop": 404, "env_steps": 248217600, "exact_value_avg": 0.3110659420490265, "regret_dist": 0.4927114248275757, "regret_other_env": 0.7611879706382751, "regret_corner": 0.08999656140804291, "regret_row": 0.5822467803955078, "regret_any": 0.7611879706382751, "regret_bot": 0.7903615832328796, "value_dist": 0.3110659420490265, "value_other_env": 0.06836514174938202, "value_corner": 0.6751171350479126, "value_row": 0.21444225311279297, "value_any": 0.06836514174938202, "value_bot": 0.006327533628791571, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00404.png", "entropy": 0.6975792050361633} +{"ts": "2026-01-29T21:34:03.594853Z", "loop": 406, "env_steps": 249446400, "exact_value_avg": 0.31101152300834656, "regret_dist": 0.492765873670578, "regret_other_env": 0.7611909508705139, "regret_corner": 0.09012815356254578, "regret_row": 0.5812146663665771, "regret_any": 0.7611909508705139, "regret_bot": 0.7904301881790161, "value_dist": 0.31101152300834656, "value_other_env": 0.06836214661598206, "value_corner": 0.6749855875968933, "value_row": 0.21547436714172363, "value_any": 0.06836214661598206, "value_bot": 0.00625881040468812, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00406.png", "entropy": 0.6972285509109497} +{"ts": "2026-01-29T21:34:05.955337Z", "loop": 408, "env_steps": 250675200, "exact_value_avg": 0.31106144189834595, "regret_dist": 0.4927159547805786, "regret_other_env": 0.7611925601959229, "regret_corner": 0.09000102430582047, "regret_row": 0.5819851756095886, "regret_any": 0.7611925601959229, "regret_bot": 0.7903797030448914, "value_dist": 0.31106144189834595, "value_other_env": 0.06836055964231491, "value_corner": 0.6751127243041992, "value_row": 0.21470382809638977, "value_any": 0.06836055964231491, "value_bot": 0.006309289950877428, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00408.png", "entropy": 0.6973420977592468} +{"ts": "2026-01-29T21:34:08.316882Z", "loop": 410, "env_steps": 251904000, "exact_value_avg": 0.3111657500267029, "regret_dist": 0.4926116466522217, "regret_other_env": 0.7611924409866333, "regret_corner": 0.0897403433918953, "regret_row": 0.585058867931366, "regret_any": 0.7611924409866333, "regret_bot": 0.7901757955551147, "value_dist": 0.3111657500267029, "value_other_env": 0.06836068630218506, "value_corner": 0.675373375415802, "value_row": 0.2116301953792572, "value_any": 0.06836068630218506, "value_bot": 0.006513205356895924, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00410.png", "entropy": 0.6977403163909912} +{"ts": "2026-01-29T21:34:10.681644Z", "loop": 412, "env_steps": 253132800, "exact_value_avg": 0.31113356351852417, "regret_dist": 0.4926438629627228, "regret_other_env": 0.7612043619155884, "regret_corner": 0.08980301767587662, "regret_row": 0.589981734752655, "regret_any": 0.7612043619155884, "regret_bot": 0.7898408770561218, "value_dist": 0.31113356351852417, "value_other_env": 0.06834876537322998, "value_corner": 0.6753106713294983, "value_row": 0.20670729875564575, "value_any": 0.06834876537322998, "value_bot": 0.0068482160568237305, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00412.png", "entropy": 0.6976697444915771} +{"ts": "2026-01-29T21:34:13.041341Z", "loop": 414, "env_steps": 254361600, "exact_value_avg": 0.3108917772769928, "regret_dist": 0.4928855895996094, "regret_other_env": 0.7612296938896179, "regret_corner": 0.09036937355995178, "regret_row": 0.5943170189857483, "regret_any": 0.7612296938896179, "regret_bot": 0.789534866809845, "value_dist": 0.3108917772769928, "value_other_env": 0.06832335144281387, "value_corner": 0.6747443675994873, "value_row": 0.20237208902835846, "value_any": 0.06832335144281387, "value_bot": 0.007154213264584541, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00414.png", "entropy": 0.6968175172805786} +{"ts": "2026-01-29T21:34:15.402902Z", "loop": 416, "env_steps": 255590400, "exact_value_avg": 0.3105093240737915, "regret_dist": 0.49326807260513306, "regret_other_env": 0.761267900466919, "regret_corner": 0.09126830101013184, "regret_row": 0.5983140468597412, "regret_any": 0.761267900466919, "regret_bot": 0.789243757724762, "value_dist": 0.3105093240737915, "value_other_env": 0.06828520447015762, "value_corner": 0.6738454699516296, "value_row": 0.19837507605552673, "value_any": 0.06828520447015762, "value_bot": 0.007445267401635647, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00416.png", "entropy": 0.6953931450843811} +{"ts": "2026-01-29T21:34:17.761687Z", "loop": 418, "env_steps": 256819200, "exact_value_avg": 0.3106953799724579, "regret_dist": 0.4930819571018219, "regret_other_env": 0.7612550854682922, "regret_corner": 0.09082219749689102, "regret_row": 0.5966883301734924, "regret_any": 0.7612550854682922, "regret_bot": 0.7893638610839844, "value_dist": 0.3106953799724579, "value_other_env": 0.06829796731472015, "value_corner": 0.6742914915084839, "value_row": 0.20000076293945312, "value_any": 0.06829796731472015, "value_bot": 0.007325176615267992, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00418.png", "entropy": 0.6958819627761841} +{"ts": "2026-01-29T21:34:20.120372Z", "loop": 420, "env_steps": 258048000, "exact_value_avg": 0.31111323833465576, "regret_dist": 0.4926642179489136, "regret_other_env": 0.7612233757972717, "regret_corner": 0.08982542902231216, "regret_row": 0.5910024046897888, "regret_any": 0.7612233757972717, "regret_bot": 0.7897719740867615, "value_dist": 0.31111323833465576, "value_other_env": 0.06832979619503021, "value_corner": 0.6752883195877075, "value_row": 0.20568664371967316, "value_any": 0.06832979619503021, "value_bot": 0.006917063146829605, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00420.png", "entropy": 0.6970962285995483} +{"ts": "2026-01-29T21:34:22.482595Z", "loop": 422, "env_steps": 259276800, "exact_value_avg": 0.31118330359458923, "regret_dist": 0.49259406328201294, "regret_other_env": 0.7612152695655823, "regret_corner": 0.08966225385665894, "regret_row": 0.5851456522941589, "regret_any": 0.7612152695655823, "regret_bot": 0.7901745438575745, "value_dist": 0.31118330359458923, "value_other_env": 0.0683378279209137, "value_corner": 0.6754515171051025, "value_row": 0.21154338121414185, "value_any": 0.0683378279209137, "value_bot": 0.006514529697597027, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00422.png", "entropy": 0.6970853805541992} +{"ts": "2026-01-29T21:34:24.850013Z", "loop": 424, "env_steps": 260505600, "exact_value_avg": 0.310953289270401, "regret_dist": 0.49282410740852356, "regret_other_env": 0.7612305879592896, "regret_corner": 0.0902143344283104, "regret_row": 0.5800036191940308, "regret_any": 0.7612305879592896, "regret_bot": 0.7905134558677673, "value_dist": 0.310953289270401, "value_other_env": 0.06832250207662582, "value_corner": 0.6748994588851929, "value_row": 0.2166854292154312, "value_any": 0.06832250207662582, "value_bot": 0.0061755855567753315, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00424.png", "entropy": 0.6960200071334839} +{"ts": "2026-01-29T21:34:27.215559Z", "loop": 426, "env_steps": 261734400, "exact_value_avg": 0.31059128046035767, "regret_dist": 0.4931861162185669, "regret_other_env": 0.7612531185150146, "regret_corner": 0.09108560532331467, "regret_row": 0.5761982798576355, "regret_any": 0.7612531185150146, "regret_bot": 0.7907586097717285, "value_dist": 0.31059128046035767, "value_other_env": 0.06830001622438431, "value_corner": 0.6740281581878662, "value_row": 0.22049076855182648, "value_any": 0.06830001622438431, "value_bot": 0.005930424202233553, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00426.png", "entropy": 0.6945598125457764} +{"ts": "2026-01-29T21:34:29.579998Z", "loop": 428, "env_steps": 262963200, "exact_value_avg": 0.3107697665691376, "regret_dist": 0.4930076003074646, "regret_other_env": 0.7612451314926147, "regret_corner": 0.09065131843090057, "regret_row": 0.5777992606163025, "regret_any": 0.7612451314926147, "regret_bot": 0.7906595468521118, "value_dist": 0.3107697665691376, "value_other_env": 0.06830796599388123, "value_corner": 0.6744624376296997, "value_row": 0.2188897728919983, "value_any": 0.06830796599388123, "value_bot": 0.006029450334608555, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00428.png", "entropy": 0.6951026916503906} +{"ts": "2026-01-29T21:34:31.941061Z", "loop": 430, "env_steps": 264192000, "exact_value_avg": 0.3111523687839508, "regret_dist": 0.49262502789497375, "regret_other_env": 0.7612225413322449, "regret_corner": 0.08972867578268051, "regret_row": 0.5834167003631592, "regret_any": 0.7612225413322449, "regret_bot": 0.7902955412864685, "value_dist": 0.3111523687839508, "value_other_env": 0.0683305636048317, "value_corner": 0.675385057926178, "value_row": 0.2132723182439804, "value_any": 0.0683305636048317, "value_bot": 0.0063935271464288235, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00430.png", "entropy": 0.6964962482452393} +{"ts": "2026-01-29T21:34:34.302530Z", "loop": 432, "env_steps": 265420800, "exact_value_avg": 0.31116849184036255, "regret_dist": 0.492608904838562, "regret_other_env": 0.7612323760986328, "regret_corner": 0.08967358618974686, "regret_row": 0.589922308921814, "regret_any": 0.7612323760986328, "regret_bot": 0.7898535132408142, "value_dist": 0.31116849184036255, "value_other_env": 0.06832073628902435, "value_corner": 0.6754401326179504, "value_row": 0.2067667543888092, "value_any": 0.06832073628902435, "value_bot": 0.006835565436631441, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00432.png", "entropy": 0.6965876817703247} +{"ts": "2026-01-29T21:34:36.663779Z", "loop": 434, "env_steps": 266649600, "exact_value_avg": 0.31077003479003906, "regret_dist": 0.4930073618888855, "regret_other_env": 0.7612752914428711, "regret_corner": 0.09060540795326233, "regret_row": 0.5962564945220947, "regret_any": 0.7612752914428711, "regret_bot": 0.789401113986969, "value_dist": 0.31077003479003906, "value_other_env": 0.06827780604362488, "value_corner": 0.6745083332061768, "value_row": 0.20043255388736725, "value_any": 0.06827780604362488, "value_bot": 0.0072879428043961525, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00434.png", "entropy": 0.6951637268066406} +{"ts": "2026-01-29T21:34:39.027115Z", "loop": 436, "env_steps": 267878400, "exact_value_avg": 0.31067708134651184, "regret_dist": 0.49310028553009033, "regret_other_env": 0.7612869739532471, "regret_corner": 0.09082020074129105, "regret_row": 0.5972338318824768, "regret_any": 0.7612869739532471, "regret_bot": 0.7893288135528564, "value_dist": 0.31067708134651184, "value_other_env": 0.06826610863208771, "value_corner": 0.6742935180664062, "value_row": 0.19945526123046875, "value_any": 0.06826610863208771, "value_bot": 0.007360274437814951, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00436.png", "entropy": 0.6947342157363892} +{"ts": "2026-01-29T21:34:41.400395Z", "loop": 438, "env_steps": 269107200, "exact_value_avg": 0.31109100580215454, "regret_dist": 0.49268636107444763, "regret_other_env": 0.7612516283988953, "regret_corner": 0.0898384302854538, "regret_row": 0.592039942741394, "regret_any": 0.7612516283988953, "regret_bot": 0.7897052764892578, "value_dist": 0.31109100580215454, "value_other_env": 0.06830150634050369, "value_corner": 0.6752752661705017, "value_row": 0.20464913547039032, "value_any": 0.06830150634050369, "value_bot": 0.006983768194913864, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00438.png", "entropy": 0.6960510611534119} +{"ts": "2026-01-29T21:34:43.767980Z", "loop": 440, "env_steps": 270336000, "exact_value_avg": 0.31121620535850525, "regret_dist": 0.4925611615180969, "regret_other_env": 0.7612403035163879, "regret_corner": 0.08954242616891861, "regret_row": 0.5882536172866821, "regret_any": 0.7612403035163879, "regret_bot": 0.7899701595306396, "value_dist": 0.31121620535850525, "value_other_env": 0.06831277906894684, "value_corner": 0.6755713224411011, "value_row": 0.20843544602394104, "value_any": 0.06831277906894684, "value_bot": 0.006718918681144714, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00440.png", "entropy": 0.6963906288146973} +{"ts": "2026-01-29T21:34:46.136785Z", "loop": 442, "env_steps": 271564800, "exact_value_avg": 0.31122851371765137, "regret_dist": 0.4925489127635956, "regret_other_env": 0.761238157749176, "regret_corner": 0.08951500058174133, "regret_row": 0.5877567529678345, "regret_any": 0.761238157749176, "regret_bot": 0.7900037169456482, "value_dist": 0.31122851371765137, "value_other_env": 0.06831502914428711, "value_corner": 0.6755987405776978, "value_row": 0.2089322805404663, "value_any": 0.06831502914428711, "value_bot": 0.0066854143515229225, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00442.png", "entropy": 0.6963464021682739} +{"ts": "2026-01-29T21:34:48.500319Z", "loop": 444, "env_steps": 272793600, "exact_value_avg": 0.31123313307762146, "regret_dist": 0.4925442636013031, "regret_other_env": 0.7612372040748596, "regret_corner": 0.08950478583574295, "regret_row": 0.5872068405151367, "regret_any": 0.7612372040748596, "regret_bot": 0.7900423407554626, "value_dist": 0.31123313307762146, "value_other_env": 0.06831585615873337, "value_corner": 0.6756089925765991, "value_row": 0.20948222279548645, "value_any": 0.06831585615873337, "value_bot": 0.006646671332418919, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00444.png", "entropy": 0.696276068687439} +{"ts": "2026-01-29T21:34:50.859700Z", "loop": 446, "env_steps": 274022400, "exact_value_avg": 0.31123724579811096, "regret_dist": 0.4925401508808136, "regret_other_env": 0.7612354159355164, "regret_corner": 0.08949718624353409, "regret_row": 0.5861120820045471, "regret_any": 0.7612354159355164, "regret_bot": 0.7901178002357483, "value_dist": 0.31123724579811096, "value_other_env": 0.0683177039027214, "value_corner": 0.6756165623664856, "value_row": 0.21057701110839844, "value_any": 0.0683177039027214, "value_bot": 0.006571230478584766, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00446.png", "entropy": 0.6962255835533142} +{"ts": "2026-01-29T21:34:53.216959Z", "loop": 448, "env_steps": 275251200, "exact_value_avg": 0.3112225830554962, "regret_dist": 0.49255481362342834, "regret_other_env": 0.7612344026565552, "regret_corner": 0.08953540772199631, "regret_row": 0.5851638317108154, "regret_any": 0.7612344026565552, "regret_bot": 0.7901827692985535, "value_dist": 0.3112225830554962, "value_other_env": 0.06831873208284378, "value_corner": 0.6755783557891846, "value_row": 0.21152523159980774, "value_any": 0.06831873208284378, "value_bot": 0.00650629960000515, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00448.png", "entropy": 0.6961631774902344} +{"ts": "2026-01-29T21:34:55.573178Z", "loop": 450, "env_steps": 276480000, "exact_value_avg": 0.3111649751663208, "regret_dist": 0.49261245131492615, "regret_other_env": 0.761245846748352, "regret_corner": 0.08966227620840073, "regret_row": 0.5907859802246094, "regret_any": 0.761245846748352, "regret_bot": 0.7897965908050537, "value_dist": 0.3111649751663208, "value_other_env": 0.06830726563930511, "value_corner": 0.6754515171051025, "value_row": 0.2059030383825302, "value_any": 0.06830726563930511, "value_bot": 0.006892478559166193, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00450.png", "entropy": 0.6960145235061646} +{"ts": "2026-01-29T21:34:57.931275Z", "loop": 452, "env_steps": 277708800, "exact_value_avg": 0.3109041452407837, "regret_dist": 0.49287328124046326, "regret_other_env": 0.7612735629081726, "regret_corner": 0.09027282893657684, "regret_row": 0.5950657725334167, "regret_any": 0.7612735629081726, "regret_bot": 0.7894919514656067, "value_dist": 0.3109041452407837, "value_other_env": 0.06827959418296814, "value_corner": 0.6748409271240234, "value_row": 0.20162327587604523, "value_any": 0.06827959418296814, "value_bot": 0.007197092287242413, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00452.png", "entropy": 0.695091724395752} +{"ts": "2026-01-29T21:35:00.289190Z", "loop": 454, "env_steps": 278937600, "exact_value_avg": 0.31095436215400696, "regret_dist": 0.49282306432724, "regret_other_env": 0.7612714767456055, "regret_corner": 0.090150386095047, "regret_row": 0.5944527983665466, "regret_any": 0.7612714767456055, "regret_bot": 0.789536714553833, "value_dist": 0.31095436215400696, "value_other_env": 0.06828169524669647, "value_corner": 0.6749633550643921, "value_row": 0.20223626494407654, "value_any": 0.06828169524669647, "value_bot": 0.00715244747698307, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00454.png", "entropy": 0.6951731443405151} +{"ts": "2026-01-29T21:35:02.653110Z", "loop": 456, "env_steps": 280166400, "exact_value_avg": 0.3112405836582184, "regret_dist": 0.4925367534160614, "regret_other_env": 0.7612444758415222, "regret_corner": 0.0894751101732254, "regret_row": 0.5859794020652771, "regret_any": 0.7612444758415222, "regret_bot": 0.7901275157928467, "value_dist": 0.3112405836582184, "value_other_env": 0.06830857694149017, "value_corner": 0.6756386160850525, "value_row": 0.21070972084999084, "value_any": 0.06830857694149017, "value_bot": 0.006561479065567255, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00456.png", "entropy": 0.6959717869758606} +{"ts": "2026-01-29T21:35:05.013924Z", "loop": 458, "env_steps": 281395200, "exact_value_avg": 0.3109002411365509, "regret_dist": 0.49287712574005127, "regret_other_env": 0.7612642049789429, "regret_corner": 0.09029652923345566, "regret_row": 0.5789068937301636, "regret_any": 0.7612642049789429, "regret_bot": 0.790592610836029, "value_dist": 0.3109002411365509, "value_other_env": 0.0682888850569725, "value_corner": 0.6748172640800476, "value_row": 0.2177821397781372, "value_any": 0.0682888850569725, "value_bot": 0.006096454802900553, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00458.png", "entropy": 0.6946619153022766} +{"ts": "2026-01-29T21:35:07.386264Z", "loop": 460, "env_steps": 282624000, "exact_value_avg": 0.31063881516456604, "regret_dist": 0.49313855171203613, "regret_other_env": 0.7612786889076233, "regret_corner": 0.09092831611633301, "regret_row": 0.5762739777565002, "regret_any": 0.7612786889076233, "regret_bot": 0.7907599210739136, "value_dist": 0.31063881516456604, "value_other_env": 0.06827440112829208, "value_corner": 0.6741854548454285, "value_row": 0.22041505575180054, "value_any": 0.06827440112829208, "value_bot": 0.005929192993789911, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00460.png", "entropy": 0.6936936378479004} +{"ts": "2026-01-29T21:35:09.755046Z", "loop": 462, "env_steps": 283852800, "exact_value_avg": 0.3108871579170227, "regret_dist": 0.49289020895957947, "regret_other_env": 0.7612576484680176, "regret_corner": 0.0903390422463417, "regret_row": 0.5786481499671936, "regret_any": 0.7612576484680176, "regret_bot": 0.7906087040901184, "value_dist": 0.3108871579170227, "value_other_env": 0.06829545646905899, "value_corner": 0.674774706363678, "value_row": 0.21804092824459076, "value_any": 0.06829545646905899, "value_bot": 0.006080358289182186, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00462.png", "entropy": 0.6945959329605103} +{"ts": "2026-01-29T21:35:12.124887Z", "loop": 464, "env_steps": 285081600, "exact_value_avg": 0.3112186789512634, "regret_dist": 0.49255871772766113, "regret_other_env": 0.7612318992614746, "regret_corner": 0.08954892307519913, "regret_row": 0.5842639207839966, "regret_any": 0.7612318992614746, "regret_bot": 0.7902435064315796, "value_dist": 0.3112186789512634, "value_other_env": 0.06832121312618256, "value_corner": 0.6755648255348206, "value_row": 0.2124251276254654, "value_any": 0.06832121312618256, "value_bot": 0.006445570848882198, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00464.png", "entropy": 0.6958795785903931} +{"ts": "2026-01-29T21:35:14.510874Z", "loop": 466, "env_steps": 286310400, "exact_value_avg": 0.311256468296051, "regret_dist": 0.4925209879875183, "regret_other_env": 0.7612313032150269, "regret_corner": 0.08945543318986893, "regret_row": 0.5874751806259155, "regret_any": 0.7612313032150269, "regret_bot": 0.7900266647338867, "value_dist": 0.311256468296051, "value_other_env": 0.0683218464255333, "value_corner": 0.6756583452224731, "value_row": 0.20921385288238525, "value_any": 0.0683218464255333, "value_bot": 0.006662396714091301, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00466.png", "entropy": 0.6960943341255188} +{"ts": "2026-01-29T21:35:16.884704Z", "loop": 468, "env_steps": 287539200, "exact_value_avg": 0.31123608350753784, "regret_dist": 0.4925413727760315, "regret_other_env": 0.7612353563308716, "regret_corner": 0.0895003229379654, "regret_row": 0.588867723941803, "regret_any": 0.7612353563308716, "regret_bot": 0.7899293303489685, "value_dist": 0.31123608350753784, "value_other_env": 0.06831779330968857, "value_corner": 0.6756134629249573, "value_row": 0.207821324467659, "value_any": 0.06831779330968857, "value_bot": 0.006759675219655037, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00468.png", "entropy": 0.6961014270782471} +{"ts": "2026-01-29T21:35:19.247184Z", "loop": 470, "env_steps": 288768000, "exact_value_avg": 0.3112369775772095, "regret_dist": 0.4925404191017151, "regret_other_env": 0.761237382888794, "regret_corner": 0.08949495106935501, "regret_row": 0.5890148282051086, "regret_any": 0.761237382888794, "regret_bot": 0.7899166941642761, "value_dist": 0.3112369775772095, "value_other_env": 0.06831573694944382, "value_corner": 0.6756187677383423, "value_row": 0.20767426490783691, "value_any": 0.06831573694944382, "value_bot": 0.006772373337298632, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00470.png", "entropy": 0.696102499961853} +{"ts": "2026-01-29T21:35:21.609209Z", "loop": 472, "env_steps": 289996800, "exact_value_avg": 0.3112519681453705, "regret_dist": 0.4925253987312317, "regret_other_env": 0.7612408399581909, "regret_corner": 0.08945216238498688, "regret_row": 0.5880470275878906, "regret_any": 0.7612408399581909, "regret_bot": 0.7899844646453857, "value_dist": 0.3112519681453705, "value_other_env": 0.06831224262714386, "value_corner": 0.675661563873291, "value_row": 0.20864202082157135, "value_any": 0.06831224262714386, "value_bot": 0.0067046149633824825, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00472.png", "entropy": 0.6961092352867126} +{"ts": "2026-01-29T21:35:23.982164Z", "loop": 474, "env_steps": 291225600, "exact_value_avg": 0.31125524640083313, "regret_dist": 0.49252215027809143, "regret_other_env": 0.7612427473068237, "regret_corner": 0.08944121748209, "regret_row": 0.5874075889587402, "regret_any": 0.7612427473068237, "regret_bot": 0.7900269031524658, "value_dist": 0.31125524640083313, "value_other_env": 0.06831040978431702, "value_corner": 0.6756725311279297, "value_row": 0.20928150415420532, "value_any": 0.06831040978431702, "value_bot": 0.006662135943770409, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00474.png", "entropy": 0.6961424946784973} +{"ts": "2026-01-29T21:35:26.345627Z", "loop": 476, "env_steps": 292454400, "exact_value_avg": 0.31125369668006897, "regret_dist": 0.4925236701965332, "regret_other_env": 0.7612432241439819, "regret_corner": 0.08944432437419891, "regret_row": 0.5880313515663147, "regret_any": 0.7612432241439819, "regret_bot": 0.7899852395057678, "value_dist": 0.31125369668006897, "value_other_env": 0.06830988824367523, "value_corner": 0.6756693720817566, "value_row": 0.20865769684314728, "value_any": 0.06830988824367523, "value_bot": 0.0067037553526461124, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00476.png", "entropy": 0.6961640119552612} +{"ts": "2026-01-29T21:35:28.707313Z", "loop": 478, "env_steps": 293683200, "exact_value_avg": 0.31125006079673767, "regret_dist": 0.4925273060798645, "regret_other_env": 0.7612422108650208, "regret_corner": 0.08945483714342117, "regret_row": 0.5883274078369141, "regret_any": 0.7612422108650208, "regret_bot": 0.7899646162986755, "value_dist": 0.31125006079673767, "value_other_env": 0.06831089407205582, "value_corner": 0.6756588220596313, "value_row": 0.20836162567138672, "value_any": 0.06831089407205582, "value_bot": 0.0067244600504636765, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00478.png", "entropy": 0.696158766746521} +{"ts": "2026-01-29T21:35:31.071484Z", "loop": 480, "env_steps": 294912000, "exact_value_avg": 0.3112589120864868, "regret_dist": 0.49251845479011536, "regret_other_env": 0.7612355351448059, "regret_corner": 0.08944280445575714, "regret_row": 0.58653324842453, "regret_any": 0.7612355351448059, "regret_bot": 0.7900860905647278, "value_dist": 0.3112589120864868, "value_other_env": 0.06831756234169006, "value_corner": 0.6756709218025208, "value_row": 0.21015578508377075, "value_any": 0.06831756234169006, "value_bot": 0.006602925714105368, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00480.png", "entropy": 0.6961852312088013} +{"ts": "2026-01-29T21:35:33.446820Z", "loop": 482, "env_steps": 296140800, "exact_value_avg": 0.3112544119358063, "regret_dist": 0.4925229847431183, "regret_other_env": 0.7612361311912537, "regret_corner": 0.08945325762033463, "regret_row": 0.5861046314239502, "regret_any": 0.7612361311912537, "regret_bot": 0.7901151180267334, "value_dist": 0.3112544119358063, "value_other_env": 0.06831701844930649, "value_corner": 0.6756604909896851, "value_row": 0.21058443188667297, "value_any": 0.06831701844930649, "value_bot": 0.006573859602212906, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00482.png", "entropy": 0.6961876749992371} +{"ts": "2026-01-29T21:35:35.809796Z", "loop": 484, "env_steps": 297369600, "exact_value_avg": 0.31124868988990784, "regret_dist": 0.4925287067890167, "regret_other_env": 0.7612351775169373, "regret_corner": 0.08946896344423294, "regret_row": 0.585431694984436, "regret_any": 0.7612351775169373, "regret_bot": 0.7901596426963806, "value_dist": 0.31124868988990784, "value_other_env": 0.06831792742013931, "value_corner": 0.6756447553634644, "value_row": 0.21125732362270355, "value_any": 0.06831792742013931, "value_bot": 0.006529470440000296, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00484.png", "entropy": 0.6961620450019836} +{"ts": "2026-01-29T21:35:38.175259Z", "loop": 486, "env_steps": 298598400, "exact_value_avg": 0.3111903667449951, "regret_dist": 0.49258702993392944, "regret_other_env": 0.7612385749816895, "regret_corner": 0.08960967510938644, "regret_row": 0.5831961035728455, "regret_any": 0.7612385749816895, "regret_bot": 0.7903079390525818, "value_dist": 0.3111903667449951, "value_other_env": 0.06831454485654831, "value_corner": 0.6755040287971497, "value_row": 0.21349290013313293, "value_any": 0.06831454485654831, "value_bot": 0.006381120067089796, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00486.png", "entropy": 0.6959277987480164} +{"ts": "2026-01-29T21:35:40.536339Z", "loop": 488, "env_steps": 299827200, "exact_value_avg": 0.31122320890426636, "regret_dist": 0.4925541281700134, "regret_other_env": 0.761239767074585, "regret_corner": 0.08952566981315613, "regret_row": 0.5838889479637146, "regret_any": 0.761239767074585, "regret_bot": 0.7902629971504211, "value_dist": 0.31122320890426636, "value_other_env": 0.06831327825784683, "value_corner": 0.675588071346283, "value_row": 0.21280013024806976, "value_any": 0.06831327825784683, "value_bot": 0.0064260344952344894, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00488.png", "entropy": 0.6959860324859619} +{"ts": "2026-01-29T21:35:42.895849Z", "loop": 490, "env_steps": 301056000, "exact_value_avg": 0.3112269937992096, "regret_dist": 0.4925503432750702, "regret_other_env": 0.7612477540969849, "regret_corner": 0.08950422704219818, "regret_row": 0.5897831320762634, "regret_any": 0.7612477540969849, "regret_bot": 0.789865255355835, "value_dist": 0.3112269937992096, "value_other_env": 0.06830533593893051, "value_corner": 0.6756094694137573, "value_row": 0.20690588653087616, "value_any": 0.06830533593893051, "value_bot": 0.0068237693049013615, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00490.png", "entropy": 0.69612056016922} +{"ts": "2026-01-29T21:35:45.259816Z", "loop": 492, "env_steps": 302284800, "exact_value_avg": 0.31112349033355713, "regret_dist": 0.4926539361476898, "regret_other_env": 0.7612589001655579, "regret_corner": 0.08974641561508179, "regret_row": 0.5923125743865967, "regret_any": 0.7612589001655579, "regret_bot": 0.7896903157234192, "value_dist": 0.31112349033355713, "value_other_env": 0.06829424947500229, "value_corner": 0.6753673553466797, "value_row": 0.20437651872634888, "value_any": 0.06829424947500229, "value_bot": 0.006998783443123102, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00492.png", "entropy": 0.6957374215126038} +{"ts": "2026-01-29T21:35:47.631986Z", "loop": 494, "env_steps": 303513600, "exact_value_avg": 0.3111516833305359, "regret_dist": 0.49262571334838867, "regret_other_env": 0.7612555027008057, "regret_corner": 0.08968096226453781, "regret_row": 0.5919230580329895, "regret_any": 0.7612555027008057, "regret_bot": 0.7897177934646606, "value_dist": 0.3111516833305359, "value_other_env": 0.0682976245880127, "value_corner": 0.6754327416419983, "value_row": 0.20476599037647247, "value_any": 0.0682976245880127, "value_bot": 0.006971312221139669, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00494.png", "entropy": 0.6957358121871948} +{"ts": "2026-01-29T21:35:50.002834Z", "loop": 496, "env_steps": 304742400, "exact_value_avg": 0.3112821877002716, "regret_dist": 0.49249517917633057, "regret_other_env": 0.7612393498420715, "regret_corner": 0.08937890082597733, "regret_row": 0.5877806544303894, "regret_any": 0.7612393498420715, "regret_bot": 0.7900010347366333, "value_dist": 0.3112821877002716, "value_other_env": 0.06831371784210205, "value_corner": 0.6757348775863647, "value_row": 0.20890842378139496, "value_any": 0.06831371784210205, "value_bot": 0.006688002031296492, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00496.png", "entropy": 0.6960512399673462} +{"ts": "2026-01-29T21:35:52.364180Z", "loop": 498, "env_steps": 305971200, "exact_value_avg": 0.3111344277858734, "regret_dist": 0.49264293909072876, "regret_other_env": 0.7612432241439819, "regret_corner": 0.08974248915910721, "regret_row": 0.5818058848381042, "regret_any": 0.7612432241439819, "regret_bot": 0.7903989553451538, "value_dist": 0.3111344277858734, "value_other_env": 0.06830990314483643, "value_corner": 0.6753712296485901, "value_row": 0.21488317847251892, "value_any": 0.06830990314483643, "value_bot": 0.006290117744356394, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00498.png", "entropy": 0.6954476237297058} +{"ts": "2026-01-29T21:35:54.726563Z", "loop": 500, "env_steps": 307200000, "exact_value_avg": 0.3104945719242096, "regret_dist": 0.49328282475471497, "regret_other_env": 0.7612892389297485, "regret_corner": 0.0912732183933258, "regret_row": 0.5748467445373535, "regret_any": 0.7612892389297485, "regret_bot": 0.7908442616462708, "value_dist": 0.3104945719242096, "value_other_env": 0.06826392561197281, "value_corner": 0.6738405227661133, "value_row": 0.22184234857559204, "value_any": 0.06826392561197281, "value_bot": 0.005844801664352417, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00500.png", "entropy": 0.6931332945823669} +{"ts": "2026-01-29T21:36:00.574278Z", "loop": 505, "env_steps": 310272000, "exact_value_avg": 0.3107210397720337, "regret_dist": 0.4930563271045685, "regret_other_env": 0.7612791657447815, "regret_corner": 0.09072202444076538, "regret_row": 0.576809823513031, "regret_any": 0.7612791657447815, "regret_bot": 0.790723443031311, "value_dist": 0.3107210397720337, "value_other_env": 0.0682738870382309, "value_corner": 0.6743917465209961, "value_row": 0.21987923979759216, "value_any": 0.0682738870382309, "value_bot": 0.005965565796941519, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00505.png", "entropy": 0.6941984295845032} +{"ts": "2026-01-29T21:36:06.419649Z", "loop": 510, "env_steps": 313344000, "exact_value_avg": 0.31056541204452515, "regret_dist": 0.4932119846343994, "regret_other_env": 0.7613003253936768, "regret_corner": 0.09107936173677444, "regret_row": 0.5985926985740662, "regret_any": 0.7613003253936768, "regret_bot": 0.789232075214386, "value_dist": 0.31056541204452515, "value_other_env": 0.06825277954339981, "value_corner": 0.6740343570709229, "value_row": 0.1980963498353958, "value_any": 0.06825277954339981, "value_bot": 0.007457023486495018, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00510.png", "entropy": 0.6943655610084534} +{"ts": "2026-01-29T21:36:12.265894Z", "loop": 515, "env_steps": 316416000, "exact_value_avg": 0.3112090229988098, "regret_dist": 0.49256831407546997, "regret_other_env": 0.7612391710281372, "regret_corner": 0.08956204354763031, "regret_row": 0.5906755924224854, "regret_any": 0.7612391710281372, "regret_bot": 0.7897998690605164, "value_dist": 0.3112090229988098, "value_other_env": 0.06831393390893936, "value_corner": 0.6755516529083252, "value_row": 0.2060135304927826, "value_any": 0.06831393390893936, "value_bot": 0.006889219395816326, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00515.png", "entropy": 0.6965973973274231} +{"ts": "2026-01-29T21:36:18.111593Z", "loop": 520, "env_steps": 319488000, "exact_value_avg": 0.3105027675628662, "regret_dist": 0.49327462911605835, "regret_other_env": 0.7612825632095337, "regret_corner": 0.09126264601945877, "regret_row": 0.5749693512916565, "regret_any": 0.7612825632095337, "regret_bot": 0.790837287902832, "value_dist": 0.3105027675628662, "value_other_env": 0.06827054172754288, "value_corner": 0.6738510727882385, "value_row": 0.2217196822166443, "value_any": 0.06827054172754288, "value_bot": 0.005851775873452425, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00520.png", "entropy": 0.6939330697059631} +{"ts": "2026-01-29T21:36:23.959674Z", "loop": 525, "env_steps": 322560000, "exact_value_avg": 0.31098389625549316, "regret_dist": 0.49279356002807617, "regret_other_env": 0.7612526416778564, "regret_corner": 0.090104840695858, "regret_row": 0.5794150233268738, "regret_any": 0.7612526416778564, "regret_bot": 0.7905551791191101, "value_dist": 0.31098389625549316, "value_other_env": 0.06830048561096191, "value_corner": 0.6750089526176453, "value_row": 0.217274010181427, "value_any": 0.06830048561096191, "value_bot": 0.006133930291980505, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00525.png", "entropy": 0.6954683065414429} +{"ts": "2026-01-29T21:36:29.795888Z", "loop": 530, "env_steps": 325632000, "exact_value_avg": 0.31084901094436646, "regret_dist": 0.4929283857345581, "regret_other_env": 0.7612740993499756, "regret_corner": 0.0904097780585289, "regret_row": 0.5960649251937866, "regret_any": 0.7612740993499756, "regret_bot": 0.7894185185432434, "value_dist": 0.31084901094436646, "value_other_env": 0.06827906519174576, "value_corner": 0.6747039556503296, "value_row": 0.20062410831451416, "value_any": 0.06827906519174576, "value_bot": 0.007270477712154388, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00530.png", "entropy": 0.6953476071357727} +{"ts": "2026-01-29T21:36:35.631701Z", "loop": 535, "env_steps": 328704000, "exact_value_avg": 0.31073281168937683, "regret_dist": 0.49304455518722534, "regret_other_env": 0.761296808719635, "regret_corner": 0.09066610783338547, "regret_row": 0.5973970890045166, "regret_any": 0.761296808719635, "regret_bot": 0.7893227338790894, "value_dist": 0.31073281168937683, "value_other_env": 0.06825626641511917, "value_corner": 0.6744475960731506, "value_row": 0.19929195940494537, "value_any": 0.06825626641511917, "value_bot": 0.007366281468421221, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00535.png", "entropy": 0.69463050365448} +{"ts": "2026-01-29T21:36:41.474487Z", "loop": 540, "env_steps": 331776000, "exact_value_avg": 0.3112812042236328, "regret_dist": 0.49249616265296936, "regret_other_env": 0.7612550854682922, "regret_corner": 0.08935771137475967, "regret_row": 0.5893591642379761, "regret_any": 0.7612550854682922, "regret_bot": 0.7898964285850525, "value_dist": 0.3112812042236328, "value_other_env": 0.06829800456762314, "value_corner": 0.67575603723526, "value_row": 0.2073298990726471, "value_any": 0.06829800456762314, "value_bot": 0.0067925481125712395, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00540.png", "entropy": 0.6960991024971008} +{"ts": "2026-01-29T21:36:47.346866Z", "loop": 545, "env_steps": 334848000, "exact_value_avg": 0.3110560178756714, "regret_dist": 0.4927213490009308, "regret_other_env": 0.7612653374671936, "regret_corner": 0.08990536630153656, "regret_row": 0.5800558924674988, "regret_any": 0.7612653374671936, "regret_bot": 0.7905176281929016, "value_dist": 0.3110560178756714, "value_other_env": 0.06828779727220535, "value_corner": 0.675208330154419, "value_row": 0.21663320064544678, "value_any": 0.06828779727220535, "value_bot": 0.0061714365147054195, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00545.png", "entropy": 0.6950972080230713} +{"ts": "2026-01-29T21:36:53.205589Z", "loop": 550, "env_steps": 337920000, "exact_value_avg": 0.3112677335739136, "regret_dist": 0.4925095736980438, "regret_other_env": 0.7612608671188354, "regret_corner": 0.08938263356685638, "regret_row": 0.5903659462928772, "regret_any": 0.7612608671188354, "regret_bot": 0.7898281812667847, "value_dist": 0.3112677335739136, "value_other_env": 0.06829217076301575, "value_corner": 0.6757310628890991, "value_row": 0.20632311701774597, "value_any": 0.06829217076301575, "value_bot": 0.006860882975161076, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00550.png", "entropy": 0.6959137916564941} +{"ts": "2026-01-29T21:36:59.069798Z", "loop": 555, "env_steps": 340992000, "exact_value_avg": 0.3104470372200012, "regret_dist": 0.49333032965660095, "regret_other_env": 0.7613367438316345, "regret_corner": 0.09132062643766403, "regret_row": 0.5999739170074463, "regret_any": 0.7613367438316345, "regret_bot": 0.789132833480835, "value_dist": 0.3104470372200012, "value_other_env": 0.06821630895137787, "value_corner": 0.6737930774688721, "value_row": 0.19671514630317688, "value_any": 0.06821630895137787, "value_bot": 0.007556264754384756, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00555.png", "entropy": 0.6933533549308777} +{"ts": "2026-01-29T21:37:04.921661Z", "loop": 560, "env_steps": 344064000, "exact_value_avg": 0.3111395537853241, "regret_dist": 0.4926378130912781, "regret_other_env": 0.761269211769104, "regret_corner": 0.08969065546989441, "regret_row": 0.5929062962532043, "regret_any": 0.761269211769104, "regret_bot": 0.7896487712860107, "value_dist": 0.3111395537853241, "value_other_env": 0.06828386336565018, "value_corner": 0.6754230856895447, "value_row": 0.20378276705741882, "value_any": 0.06828386336565018, "value_bot": 0.007040292955935001, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00560.png", "entropy": 0.6958786249160767} +{"ts": "2026-01-29T21:37:10.771479Z", "loop": 565, "env_steps": 347136000, "exact_value_avg": 0.3113134503364563, "regret_dist": 0.4924639165401459, "regret_other_env": 0.761241614818573, "regret_corner": 0.08929731696844101, "regret_row": 0.5876027941703796, "regret_any": 0.761241614818573, "regret_bot": 0.7900170087814331, "value_dist": 0.3113134503364563, "value_other_env": 0.06831151247024536, "value_corner": 0.6758163571357727, "value_row": 0.20908625423908234, "value_any": 0.06831151247024536, "value_bot": 0.006672062911093235, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00565.png", "entropy": 0.6967537999153137} +{"ts": "2026-01-29T21:37:16.628998Z", "loop": 570, "env_steps": 350208000, "exact_value_avg": 0.3112494647502899, "regret_dist": 0.49252796173095703, "regret_other_env": 0.7612365484237671, "regret_corner": 0.08946499973535538, "regret_row": 0.5835890769958496, "regret_any": 0.7612365484237671, "regret_bot": 0.7902832627296448, "value_dist": 0.3112494647502899, "value_other_env": 0.06831654906272888, "value_corner": 0.6756488084793091, "value_row": 0.21310003101825714, "value_any": 0.06831654906272888, "value_bot": 0.006405770778656006, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00570.png", "entropy": 0.6968011856079102} +{"ts": "2026-01-29T21:37:22.482629Z", "loop": 575, "env_steps": 353280000, "exact_value_avg": 0.31130731105804443, "regret_dist": 0.49247002601623535, "regret_other_env": 0.7612292766571045, "regret_corner": 0.08933112770318985, "regret_row": 0.5880570411682129, "regret_any": 0.7612292766571045, "regret_bot": 0.7899842262268066, "value_dist": 0.31130731105804443, "value_other_env": 0.06832382082939148, "value_corner": 0.6757825613021851, "value_row": 0.20863202214241028, "value_any": 0.06832382082939148, "value_bot": 0.0067048585042357445, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00575.png", "entropy": 0.6972960233688354} +{"ts": "2026-01-29T21:37:28.323830Z", "loop": 580, "env_steps": 356352000, "exact_value_avg": 0.311282217502594, "regret_dist": 0.49249517917633057, "regret_other_env": 0.7612438797950745, "regret_corner": 0.08937209844589233, "regret_row": 0.589826226234436, "regret_any": 0.7612438797950745, "regret_bot": 0.7898635268211365, "value_dist": 0.311282217502594, "value_other_env": 0.06830926984548569, "value_corner": 0.6757416129112244, "value_row": 0.20686274766921997, "value_any": 0.06830926984548569, "value_bot": 0.006825491786003113, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00580.png", "entropy": 0.6970637440681458} +{"ts": "2026-01-29T21:37:34.174506Z", "loop": 585, "env_steps": 359424000, "exact_value_avg": 0.31132280826568604, "regret_dist": 0.49245455861091614, "regret_other_env": 0.7612393498420715, "regret_corner": 0.08927731961011887, "regret_row": 0.5854607224464417, "regret_any": 0.7612393498420715, "regret_bot": 0.7901608943939209, "value_dist": 0.31132280826568604, "value_other_env": 0.06831373274326324, "value_corner": 0.675836443901062, "value_row": 0.21122831106185913, "value_any": 0.06831373274326324, "value_bot": 0.006528182420879602, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00585.png", "entropy": 0.6968191862106323} +{"ts": "2026-01-29T21:37:40.015410Z", "loop": 590, "env_steps": 362496000, "exact_value_avg": 0.3108358383178711, "regret_dist": 0.49294155836105347, "regret_other_env": 0.7612771987915039, "regret_corner": 0.09043803811073303, "regret_row": 0.577210009098053, "regret_any": 0.7612771987915039, "regret_bot": 0.790701150894165, "value_dist": 0.3108358383178711, "value_other_env": 0.06827598810195923, "value_corner": 0.6746756434440613, "value_row": 0.219479039311409, "value_any": 0.06827598810195923, "value_bot": 0.005987903568893671, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00590.png", "entropy": 0.6946672797203064} +{"ts": "2026-01-29T21:37:45.855365Z", "loop": 595, "env_steps": 365568000, "exact_value_avg": 0.31090855598449707, "regret_dist": 0.4928688406944275, "regret_other_env": 0.761285126209259, "regret_corner": 0.0902443453669548, "regret_row": 0.5778873562812805, "regret_any": 0.761285126209259, "regret_bot": 0.7906603813171387, "value_dist": 0.31090855598449707, "value_other_env": 0.06826804578304291, "value_corner": 0.6748692989349365, "value_row": 0.21880166232585907, "value_any": 0.06826804578304291, "value_bot": 0.006028686184436083, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00595.png", "entropy": 0.6945942044258118} +{"ts": "2026-01-29T21:37:51.699986Z", "loop": 600, "env_steps": 368640000, "exact_value_avg": 0.31136763095855713, "regret_dist": 0.4924098253250122, "regret_other_env": 0.7612584233283997, "regret_corner": 0.08913684636354446, "regret_row": 0.5873236060142517, "regret_any": 0.7612584233283997, "regret_bot": 0.7900421619415283, "value_dist": 0.31136763095855713, "value_other_env": 0.06829474121332169, "value_corner": 0.6759769320487976, "value_row": 0.20936542749404907, "value_any": 0.06829474121332169, "value_bot": 0.0066468301229178905, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00600.png", "entropy": 0.6961453557014465} +{"ts": "2026-01-29T21:37:57.544270Z", "loop": 605, "env_steps": 371712000, "exact_value_avg": 0.3111541271209717, "regret_dist": 0.4926232695579529, "regret_other_env": 0.7612870335578918, "regret_corner": 0.08962760865688324, "regret_row": 0.5936815738677979, "regret_any": 0.7612870335578918, "regret_bot": 0.7896011471748352, "value_dist": 0.3111541271209717, "value_other_env": 0.06826609373092651, "value_corner": 0.675486147403717, "value_row": 0.20300747454166412, "value_any": 0.06826609373092651, "value_bot": 0.007087905425578356, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00605.png", "entropy": 0.6953420042991638} +{"ts": "2026-01-29T21:38:03.382220Z", "loop": 610, "env_steps": 374784000, "exact_value_avg": 0.31133437156677246, "regret_dist": 0.4924430251121521, "regret_other_env": 0.7612674832344055, "regret_corner": 0.08920629322528839, "regret_row": 0.584090530872345, "regret_any": 0.7612674832344055, "regret_bot": 0.7902604341506958, "value_dist": 0.31133437156677246, "value_other_env": 0.06828568875789642, "value_corner": 0.6759074330329895, "value_row": 0.2125985473394394, "value_any": 0.06828568875789642, "value_bot": 0.006428686436265707, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00610.png", "entropy": 0.6958807110786438} +{"ts": "2026-01-29T21:38:09.229077Z", "loop": 615, "env_steps": 377856000, "exact_value_avg": 0.3113388121128082, "regret_dist": 0.49243858456611633, "regret_other_env": 0.7612558603286743, "regret_corner": 0.08921264111995697, "regret_row": 0.5840698480606079, "regret_any": 0.7612558603286743, "regret_bot": 0.7902607917785645, "value_dist": 0.3113388121128082, "value_other_env": 0.06829727441072464, "value_corner": 0.6759010553359985, "value_row": 0.21261915564537048, "value_any": 0.06829727441072464, "value_bot": 0.006428265944123268, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00615.png", "entropy": 0.6961362957954407} +{"ts": "2026-01-29T21:38:15.074474Z", "loop": 620, "env_steps": 380928000, "exact_value_avg": 0.3112499713897705, "regret_dist": 0.49252739548683167, "regret_other_env": 0.7612752914428711, "regret_corner": 0.08940544724464417, "regret_row": 0.5923583507537842, "regret_any": 0.7612752914428711, "regret_bot": 0.7896943092346191, "value_dist": 0.3112499713897705, "value_other_env": 0.0682777687907219, "value_corner": 0.6757082939147949, "value_row": 0.204330712556839, "value_any": 0.0682777687907219, "value_bot": 0.006994706112891436, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00620.png", "entropy": 0.6958762407302856} +{"ts": "2026-01-29T21:38:20.915102Z", "loop": 625, "env_steps": 384000000, "exact_value_avg": 0.3112727403640747, "regret_dist": 0.4925045967102051, "regret_other_env": 0.7612669467926025, "regret_corner": 0.08936100453138351, "regret_row": 0.5820664763450623, "regret_any": 0.7612669467926025, "regret_bot": 0.7903928756713867, "value_dist": 0.3112727403640747, "value_other_env": 0.06828613579273224, "value_corner": 0.6757526993751526, "value_row": 0.21462254226207733, "value_any": 0.06828613579273224, "value_bot": 0.006296176463365555, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00625.png", "entropy": 0.695650041103363} +{"ts": "2026-01-29T21:38:26.757008Z", "loop": 630, "env_steps": 387072000, "exact_value_avg": 0.31135094165802, "regret_dist": 0.49242642521858215, "regret_other_env": 0.7612665295600891, "regret_corner": 0.08916623890399933, "regret_row": 0.5836056470870972, "regret_any": 0.7612665295600891, "regret_bot": 0.7902928590774536, "value_dist": 0.31135094165802, "value_other_env": 0.06828658282756805, "value_corner": 0.6759474873542786, "value_row": 0.21308337152004242, "value_any": 0.06828658282756805, "value_bot": 0.006396106444299221, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00630.png", "entropy": 0.6957986950874329} +{"ts": "2026-01-29T21:38:32.607827Z", "loop": 635, "env_steps": 390144000, "exact_value_avg": 0.31113940477371216, "regret_dist": 0.49263796210289, "regret_other_env": 0.761298418045044, "regret_corner": 0.08964724838733673, "regret_row": 0.5945407748222351, "regret_any": 0.761298418045044, "regret_bot": 0.7895439267158508, "value_dist": 0.31113940477371216, "value_other_env": 0.0682547390460968, "value_corner": 0.6754664182662964, "value_row": 0.2021481990814209, "value_any": 0.0682547390460968, "value_bot": 0.007145199459046125, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00635.png", "entropy": 0.6949710845947266} +{"ts": "2026-01-29T21:38:38.452369Z", "loop": 640, "env_steps": 393216000, "exact_value_avg": 0.3113672435283661, "regret_dist": 0.49241018295288086, "regret_other_env": 0.7612907290458679, "regret_corner": 0.08908934891223907, "regret_row": 0.5910292863845825, "regret_any": 0.7612907290458679, "regret_bot": 0.7897981405258179, "value_dist": 0.3113672435283661, "value_other_env": 0.06826242059469223, "value_corner": 0.6760244369506836, "value_row": 0.20565970242023468, "value_any": 0.06826242059469223, "value_bot": 0.006890964228659868, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00640.png", "entropy": 0.6954384446144104} +{"ts": "2026-01-29T21:38:44.301368Z", "loop": 645, "env_steps": 396288000, "exact_value_avg": 0.31088557839393616, "regret_dist": 0.4928918182849884, "regret_other_env": 0.7613192200660706, "regret_corner": 0.090250663459301, "regret_row": 0.5768530964851379, "regret_any": 0.7613192200660706, "regret_bot": 0.7907350063323975, "value_dist": 0.31088557839393616, "value_other_env": 0.0682338997721672, "value_corner": 0.6748631000518799, "value_row": 0.21983593702316284, "value_any": 0.0682338997721672, "value_bot": 0.005954129155725241, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00645.png", "entropy": 0.6933513283729553} +{"ts": "2026-01-29T21:38:50.146377Z", "loop": 650, "env_steps": 399360000, "exact_value_avg": 0.3109634518623352, "regret_dist": 0.49281397461891174, "regret_other_env": 0.7613173723220825, "regret_corner": 0.0900588259100914, "regret_row": 0.5774439573287964, "regret_any": 0.7613173723220825, "regret_bot": 0.790697455406189, "value_dist": 0.3109634518623352, "value_other_env": 0.06823575496673584, "value_corner": 0.6750549674034119, "value_row": 0.2192450761795044, "value_any": 0.06823575496673584, "value_bot": 0.0059915524907410145, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00650.png", "entropy": 0.6934873461723328} +{"ts": "2026-01-29T21:38:55.987139Z", "loop": 655, "env_steps": 402432000, "exact_value_avg": 0.31148040294647217, "regret_dist": 0.4922969937324524, "regret_other_env": 0.7612900733947754, "regret_corner": 0.0888073742389679, "regret_row": 0.5873233675956726, "regret_any": 0.7612900733947754, "regret_bot": 0.790055513381958, "value_dist": 0.31148040294647217, "value_other_env": 0.06826304644346237, "value_corner": 0.6763063669204712, "value_row": 0.20936569571495056, "value_any": 0.06826304644346237, "value_bot": 0.006633507087826729, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00655.png", "entropy": 0.6952702403068542} +{"ts": "2026-01-29T21:39:01.830008Z", "loop": 660, "env_steps": 405504000, "exact_value_avg": 0.31139570474624634, "regret_dist": 0.4923816919326782, "regret_other_env": 0.7613089084625244, "regret_corner": 0.08899086713790894, "regret_row": 0.5915863513946533, "regret_any": 0.7613089084625244, "regret_bot": 0.7897671461105347, "value_dist": 0.31139570474624634, "value_other_env": 0.06824421137571335, "value_corner": 0.6761229038238525, "value_row": 0.20510265231132507, "value_any": 0.06824421137571335, "value_bot": 0.0069218953140079975, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00660.png", "entropy": 0.694743275642395} +{"ts": "2026-01-29T21:39:07.695635Z", "loop": 665, "env_steps": 408576000, "exact_value_avg": 0.3115037679672241, "regret_dist": 0.49227356910705566, "regret_other_env": 0.7613089084625244, "regret_corner": 0.08872053027153015, "regret_row": 0.5887733697891235, "regret_any": 0.7613089084625244, "regret_bot": 0.789964497089386, "value_dist": 0.3115037679672241, "value_other_env": 0.06824420392513275, "value_corner": 0.6763931512832642, "value_row": 0.20791569352149963, "value_any": 0.06824420392513275, "value_bot": 0.006724518723785877, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00665.png", "entropy": 0.6948429346084595} +{"ts": "2026-01-29T21:39:13.543832Z", "loop": 670, "env_steps": 411648000, "exact_value_avg": 0.31151843070983887, "regret_dist": 0.4922589659690857, "regret_other_env": 0.7613043189048767, "regret_corner": 0.0886908546090126, "regret_row": 0.5858166217803955, "regret_any": 0.7613043189048767, "regret_bot": 0.7901641726493835, "value_dist": 0.31151843070983887, "value_other_env": 0.06824874132871628, "value_corner": 0.6764228940010071, "value_row": 0.21087238192558289, "value_any": 0.06824874132871628, "value_bot": 0.006524877622723579, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00670.png", "entropy": 0.694750189781189} +{"ts": "2026-01-29T21:39:19.406137Z", "loop": 675, "env_steps": 414720000, "exact_value_avg": 0.31149619817733765, "regret_dist": 0.4922811985015869, "regret_other_env": 0.7613094449043274, "regret_corner": 0.0887388214468956, "regret_row": 0.5842452645301819, "regret_any": 0.7613094449043274, "regret_bot": 0.7902686595916748, "value_dist": 0.31149619817733765, "value_other_env": 0.06824368238449097, "value_corner": 0.6763749122619629, "value_row": 0.21244385838508606, "value_any": 0.06824368238449097, "value_bot": 0.00642036646604538, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00675.png", "entropy": 0.6945681571960449} +{"ts": "2026-01-29T21:39:25.260963Z", "loop": 680, "env_steps": 417792000, "exact_value_avg": 0.31155964732170105, "regret_dist": 0.4922177791595459, "regret_other_env": 0.7613111138343811, "regret_corner": 0.08857771754264832, "regret_row": 0.5870082974433899, "regret_any": 0.7613111138343811, "regret_bot": 0.7900872230529785, "value_dist": 0.31155964732170105, "value_other_env": 0.06824200600385666, "value_corner": 0.6765360832214355, "value_row": 0.20968076586723328, "value_any": 0.06824200600385666, "value_bot": 0.006601826287806034, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00680.png", "entropy": 0.6947689652442932} +{"ts": "2026-01-29T21:39:31.103767Z", "loop": 685, "env_steps": 420864000, "exact_value_avg": 0.3114817142486572, "regret_dist": 0.49229565262794495, "regret_other_env": 0.7613160610198975, "regret_corner": 0.08876503258943558, "regret_row": 0.5831702947616577, "regret_any": 0.7613160610198975, "regret_bot": 0.7903425693511963, "value_dist": 0.3114817142486572, "value_other_env": 0.06823703646659851, "value_corner": 0.6763487458229065, "value_row": 0.21351881325244904, "value_any": 0.06823703646659851, "value_bot": 0.006346464157104492, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00685.png", "entropy": 0.6943981051445007} +{"ts": "2026-01-29T21:39:36.950155Z", "loop": 690, "env_steps": 423936000, "exact_value_avg": 0.31157663464546204, "regret_dist": 0.49220073223114014, "regret_other_env": 0.7613180875778198, "regret_corner": 0.08852466195821762, "regret_row": 0.5891380906105042, "regret_any": 0.7613180875778198, "regret_bot": 0.7899463772773743, "value_dist": 0.31157663464546204, "value_other_env": 0.06823501735925674, "value_corner": 0.6765890717506409, "value_row": 0.20755094289779663, "value_any": 0.06823501735925674, "value_bot": 0.006742744706571102, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00690.png", "entropy": 0.6946913599967957} +{"ts": "2026-01-29T21:39:42.799080Z", "loop": 695, "env_steps": 427008000, "exact_value_avg": 0.3115960657596588, "regret_dist": 0.49218133091926575, "regret_other_env": 0.7613198161125183, "regret_corner": 0.08847354352474213, "regret_row": 0.585955798625946, "regret_any": 0.7613198161125183, "regret_bot": 0.7901631593704224, "value_dist": 0.3115960657596588, "value_other_env": 0.06823329627513885, "value_corner": 0.6766402125358582, "value_row": 0.21073324978351593, "value_any": 0.06823329627513885, "value_bot": 0.006526044569909573, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00695.png", "entropy": 0.694614827632904} +{"ts": "2026-01-29T21:39:48.641704Z", "loop": 700, "env_steps": 430080000, "exact_value_avg": 0.3108939528465271, "regret_dist": 0.49288344383239746, "regret_other_env": 0.7613686323165894, "regret_corner": 0.09015558660030365, "regret_row": 0.5756663084030151, "regret_any": 0.7613686323165894, "regret_bot": 0.7908253073692322, "value_dist": 0.3108939528465271, "value_other_env": 0.0681845173239708, "value_corner": 0.6749580502510071, "value_row": 0.22102276980876923, "value_any": 0.0681845173239708, "value_bot": 0.005863738711923361, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00700.png", "entropy": 0.6919510364532471} +{"ts": "2026-01-29T21:39:54.492946Z", "loop": 705, "env_steps": 433152000, "exact_value_avg": 0.31163161993026733, "regret_dist": 0.4921457767486572, "regret_other_env": 0.7613241672515869, "regret_corner": 0.08837811648845673, "regret_row": 0.5859370231628418, "regret_any": 0.7613241672515869, "regret_bot": 0.7901688814163208, "value_dist": 0.31163161993026733, "value_other_env": 0.06822896748781204, "value_corner": 0.6767355799674988, "value_row": 0.21075206995010376, "value_any": 0.06822896748781204, "value_bot": 0.006520195864140987, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00705.png", "entropy": 0.6945555806159973} +{"ts": "2026-01-29T21:40:00.340094Z", "loop": 710, "env_steps": 436224000, "exact_value_avg": 0.31120187044143677, "regret_dist": 0.4925754964351654, "regret_other_env": 0.7613707780838013, "regret_corner": 0.08938255906105042, "regret_row": 0.5970324873924255, "regret_any": 0.7613707780838013, "regret_bot": 0.7894003987312317, "value_dist": 0.31120187044143677, "value_other_env": 0.06818227469921112, "value_corner": 0.6757311820983887, "value_row": 0.1996566206216812, "value_any": 0.06818227469921112, "value_bot": 0.007288701366633177, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00710.png", "entropy": 0.6929556727409363} +{"ts": "2026-01-29T21:40:06.181541Z", "loop": 715, "env_steps": 439296000, "exact_value_avg": 0.3116276264190674, "regret_dist": 0.4921497404575348, "regret_other_env": 0.7613372802734375, "regret_corner": 0.08836838603019714, "regret_row": 0.5841377973556519, "regret_any": 0.7613372802734375, "regret_bot": 0.7902928590774536, "value_dist": 0.3116276264190674, "value_other_env": 0.06821583211421967, "value_corner": 0.6767452955245972, "value_row": 0.21255117654800415, "value_any": 0.06821583211421967, "value_bot": 0.006396114360541105, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00715.png", "entropy": 0.6942728161811829} +{"ts": "2026-01-29T21:40:12.022516Z", "loop": 720, "env_steps": 442368000, "exact_value_avg": 0.31146034598350525, "regret_dist": 0.4923170506954193, "regret_other_env": 0.7613415122032166, "regret_corner": 0.08878032863140106, "regret_row": 0.5806307792663574, "regret_any": 0.7613415122032166, "regret_bot": 0.7905197143554688, "value_dist": 0.31146034598350525, "value_other_env": 0.06821160763502121, "value_corner": 0.6763334274291992, "value_row": 0.21605831384658813, "value_any": 0.06821160763502121, "value_bot": 0.006169311702251434, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00720.png", "entropy": 0.6937216520309448} +{"ts": "2026-01-29T21:40:17.866240Z", "loop": 725, "env_steps": 445440000, "exact_value_avg": 0.31168273091316223, "regret_dist": 0.49209463596343994, "regret_other_env": 0.7613240480422974, "regret_corner": 0.08825051784515381, "regret_row": 0.5901795029640198, "regret_any": 0.7613240480422974, "regret_bot": 0.7898868322372437, "value_dist": 0.31168273091316223, "value_other_env": 0.068229079246521, "value_corner": 0.6768631935119629, "value_row": 0.2065095752477646, "value_any": 0.068229079246521, "value_bot": 0.006802251096814871, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00725.png", "entropy": 0.6947370767593384} +{"ts": "2026-01-29T21:40:23.713856Z", "loop": 730, "env_steps": 448512000, "exact_value_avg": 0.31161120533943176, "regret_dist": 0.4921662211418152, "regret_other_env": 0.7613319158554077, "regret_corner": 0.08841758221387863, "regret_row": 0.5825124382972717, "regret_any": 0.7613319158554077, "regret_bot": 0.7904013395309448, "value_dist": 0.31161120533943176, "value_other_env": 0.06822119653224945, "value_corner": 0.6766961812973022, "value_row": 0.21417661011219025, "value_any": 0.06822119653224945, "value_bot": 0.00628765020519495, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00730.png", "entropy": 0.6942470073699951} +{"ts": "2026-01-29T21:40:29.561745Z", "loop": 735, "env_steps": 451584000, "exact_value_avg": 0.3116723299026489, "regret_dist": 0.492105096578598, "regret_other_env": 0.7613213062286377, "regret_corner": 0.08828071504831314, "regret_row": 0.5829147696495056, "regret_any": 0.7613213062286377, "regret_bot": 0.7903761267662048, "value_dist": 0.3116723299026489, "value_other_env": 0.06823185831308365, "value_corner": 0.6768329739570618, "value_row": 0.21377426385879517, "value_any": 0.06823185831308365, "value_bot": 0.006312948185950518, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00735.png", "entropy": 0.6942248344421387} +{"ts": "2026-01-29T21:40:35.405931Z", "loop": 740, "env_steps": 454656000, "exact_value_avg": 0.3117672801017761, "regret_dist": 0.4920101761817932, "regret_other_env": 0.7613348960876465, "regret_corner": 0.08802298456430435, "regret_row": 0.5902554988861084, "regret_any": 0.7613348960876465, "regret_bot": 0.7898920774459839, "value_dist": 0.3117672801017761, "value_other_env": 0.06821827590465546, "value_corner": 0.6770907640457153, "value_row": 0.20643360912799835, "value_any": 0.06821827590465546, "value_bot": 0.00679695513099432, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00740.png", "entropy": 0.6945430040359497} +{"ts": "2026-01-29T21:40:41.246415Z", "loop": 745, "env_steps": 457728000, "exact_value_avg": 0.31181222200393677, "regret_dist": 0.4919651746749878, "regret_other_env": 0.7613471150398254, "regret_corner": 0.08789221942424774, "regret_row": 0.58596271276474, "regret_any": 0.7613471150398254, "regret_bot": 0.7901844382286072, "value_dist": 0.31181222200393677, "value_other_env": 0.06820597499608994, "value_corner": 0.6772215366363525, "value_row": 0.21072635054588318, "value_any": 0.06820597499608994, "value_bot": 0.006504641845822334, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00745.png", "entropy": 0.6945527791976929} +{"ts": "2026-01-29T21:40:47.089024Z", "loop": 750, "env_steps": 460800000, "exact_value_avg": 0.3117983937263489, "regret_dist": 0.4919790029525757, "regret_other_env": 0.7613477110862732, "regret_corner": 0.08792584389448166, "regret_row": 0.5843116641044617, "regret_any": 0.7613477110862732, "regret_bot": 0.7902939319610596, "value_dist": 0.3117983937263489, "value_other_env": 0.06820537149906158, "value_corner": 0.6771879196166992, "value_row": 0.2123773843050003, "value_any": 0.06820537149906158, "value_bot": 0.00639519514515996, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00750.png", "entropy": 0.6944209933280945} +{"ts": "2026-01-29T21:40:52.938923Z", "loop": 755, "env_steps": 463872000, "exact_value_avg": 0.31186267733573914, "regret_dist": 0.49191465973854065, "regret_other_env": 0.7613524198532104, "regret_corner": 0.08775801956653595, "regret_row": 0.5895697474479675, "regret_any": 0.7613524198532104, "regret_bot": 0.7899469137191772, "value_dist": 0.31186267733573914, "value_other_env": 0.06820064038038254, "value_corner": 0.6773557662963867, "value_row": 0.20711937546730042, "value_any": 0.06820064038038254, "value_bot": 0.006742146797478199, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00755.png", "entropy": 0.6946989893913269} +{"ts": "2026-01-29T21:40:58.777177Z", "loop": 760, "env_steps": 466944000, "exact_value_avg": 0.3118884563446045, "regret_dist": 0.49188899993896484, "regret_other_env": 0.7613542675971985, "regret_corner": 0.0876910537481308, "regret_row": 0.5899458527565002, "regret_any": 0.7613542675971985, "regret_bot": 0.7899235486984253, "value_dist": 0.3118884563446045, "value_other_env": 0.06819893419742584, "value_corner": 0.6774227023124695, "value_row": 0.2067432403564453, "value_any": 0.06819893419742584, "value_bot": 0.006765551865100861, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00760.png", "entropy": 0.6947812438011169} +{"ts": "2026-01-29T21:41:04.618051Z", "loop": 765, "env_steps": 470016000, "exact_value_avg": 0.3115653395652771, "regret_dist": 0.4922119975090027, "regret_other_env": 0.7613762021064758, "regret_corner": 0.08846566081047058, "regret_row": 0.5792956352233887, "regret_any": 0.7613762021064758, "regret_bot": 0.7906240224838257, "value_dist": 0.3115653395652771, "value_other_env": 0.06817691028118134, "value_corner": 0.6766480207443237, "value_row": 0.2173934429883957, "value_any": 0.06817691028118134, "value_bot": 0.006065002176910639, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00765.png", "entropy": 0.6933498382568359} +{"ts": "2026-01-29T21:41:10.460568Z", "loop": 770, "env_steps": 473088000, "exact_value_avg": 0.31181392073631287, "regret_dist": 0.4919634759426117, "regret_other_env": 0.7613694071769714, "regret_corner": 0.08785456418991089, "regret_row": 0.5934897661209106, "regret_any": 0.7613694071769714, "regret_bot": 0.7896894812583923, "value_dist": 0.31181392073631287, "value_other_env": 0.06818373501300812, "value_corner": 0.6772591471672058, "value_row": 0.2031993269920349, "value_any": 0.06818373501300812, "value_bot": 0.00699955690652132, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00770.png", "entropy": 0.6941460967063904} +{"ts": "2026-01-29T21:41:16.320609Z", "loop": 775, "env_steps": 476160000, "exact_value_avg": 0.3119947016239166, "regret_dist": 0.49178266525268555, "regret_other_env": 0.7613687515258789, "regret_corner": 0.08740349858999252, "regret_row": 0.5904128551483154, "regret_any": 0.7613687515258789, "regret_bot": 0.7899044752120972, "value_dist": 0.3119947016239166, "value_other_env": 0.06818433105945587, "value_corner": 0.677710235118866, "value_row": 0.20627620816230774, "value_any": 0.06818433105945587, "value_bot": 0.006784582044929266, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00775.png", "entropy": 0.6945232152938843} +{"ts": "2026-01-29T21:41:22.181004Z", "loop": 780, "env_steps": 479232000, "exact_value_avg": 0.3118421733379364, "regret_dist": 0.49193525314331055, "regret_other_env": 0.7613677382469177, "regret_corner": 0.08778644353151321, "regret_row": 0.5813131332397461, "regret_any": 0.7613677382469177, "regret_bot": 0.7905012369155884, "value_dist": 0.3118421733379364, "value_other_env": 0.06818536669015884, "value_corner": 0.6773273348808289, "value_row": 0.2153758853673935, "value_any": 0.06818536669015884, "value_bot": 0.006187845021486282, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00780.png", "entropy": 0.6936764717102051} +{"ts": "2026-01-29T21:41:28.035514Z", "loop": 785, "env_steps": 482304000, "exact_value_avg": 0.31207597255706787, "regret_dist": 0.4917013943195343, "regret_other_env": 0.7613686919212341, "regret_corner": 0.08720042556524277, "regret_row": 0.5853330492973328, "regret_any": 0.7613686919212341, "regret_bot": 0.7902491688728333, "value_dist": 0.31207597255706787, "value_other_env": 0.06818440556526184, "value_corner": 0.6779133081436157, "value_row": 0.2113559991121292, "value_any": 0.06818440556526184, "value_bot": 0.006439880467951298, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00785.png", "entropy": 0.6943690776824951} +{"ts": "2026-01-29T21:41:33.885366Z", "loop": 790, "env_steps": 485376000, "exact_value_avg": 0.3121459186077118, "regret_dist": 0.4916314482688904, "regret_other_env": 0.7613747715950012, "regret_corner": 0.08701646327972412, "regret_row": 0.5899547338485718, "regret_any": 0.7613747715950012, "regret_bot": 0.7899453639984131, "value_dist": 0.3121459186077118, "value_other_env": 0.06817831844091415, "value_corner": 0.6780973076820374, "value_row": 0.20673437416553497, "value_any": 0.06817831844091415, "value_bot": 0.006743744481354952, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00790.png", "entropy": 0.6944509744644165} +{"ts": "2026-01-29T21:41:39.742062Z", "loop": 795, "env_steps": 488448000, "exact_value_avg": 0.31219229102134705, "regret_dist": 0.4915851056575775, "regret_other_env": 0.7613763213157654, "regret_corner": 0.08689820766448975, "regret_row": 0.5903068780899048, "regret_any": 0.7613763213157654, "regret_bot": 0.7899258732795715, "value_dist": 0.31219229102134705, "value_other_env": 0.06817677617073059, "value_corner": 0.6782155632972717, "value_row": 0.20638221502304077, "value_any": 0.06817677617073059, "value_bot": 0.006763228215277195, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00795.png", "entropy": 0.69451904296875} +{"ts": "2026-01-29T21:41:45.586188Z", "loop": 800, "env_steps": 491520000, "exact_value_avg": 0.31219691038131714, "regret_dist": 0.49158045649528503, "regret_other_env": 0.761385977268219, "regret_corner": 0.0868721529841423, "regret_row": 0.5922688841819763, "regret_any": 0.761385977268219, "regret_bot": 0.789797306060791, "value_dist": 0.31219691038131714, "value_other_env": 0.06816713511943817, "value_corner": 0.6782415509223938, "value_row": 0.2044200897216797, "value_any": 0.06816713511943817, "value_bot": 0.006891715805977583, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00800.png", "entropy": 0.6943522095680237} +{"ts": "2026-01-29T21:41:51.426690Z", "loop": 805, "env_steps": 494592000, "exact_value_avg": 0.3123462200164795, "regret_dist": 0.49143117666244507, "regret_other_env": 0.7613836526870728, "regret_corner": 0.08650244027376175, "regret_row": 0.5885109901428223, "regret_any": 0.7613836526870728, "regret_bot": 0.7900582551956177, "value_dist": 0.3123462200164795, "value_other_env": 0.0681694820523262, "value_corner": 0.6786112785339355, "value_row": 0.20817802846431732, "value_any": 0.0681694820523262, "value_bot": 0.0066308085806667805, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00805.png", "entropy": 0.6945675015449524} +{"ts": "2026-01-29T21:41:57.275112Z", "loop": 810, "env_steps": 497664000, "exact_value_avg": 0.3123002052307129, "regret_dist": 0.4914771318435669, "regret_other_env": 0.7613968849182129, "regret_corner": 0.08659739792346954, "regret_row": 0.5933802723884583, "regret_any": 0.7613968849182129, "regret_bot": 0.7897332310676575, "value_dist": 0.3123002052307129, "value_other_env": 0.06815619766712189, "value_corner": 0.6785162687301636, "value_row": 0.20330877602100372, "value_any": 0.06815619766712189, "value_bot": 0.006955854594707489, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00810.png", "entropy": 0.6940004229545593} +{"ts": "2026-01-29T21:42:03.115649Z", "loop": 815, "env_steps": 500736000, "exact_value_avg": 0.31235313415527344, "regret_dist": 0.49142423272132874, "regret_other_env": 0.7614084482192993, "regret_corner": 0.08644787967205048, "regret_row": 0.583207368850708, "regret_any": 0.7614084482192993, "regret_bot": 0.790421724319458, "value_dist": 0.31235313415527344, "value_other_env": 0.06814465671777725, "value_corner": 0.678665816783905, "value_row": 0.21348163485527039, "value_any": 0.06814465671777725, "value_bot": 0.006267431657761335, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00815.png", "entropy": 0.6938011646270752} +{"ts": "2026-01-29T21:42:08.963674Z", "loop": 820, "env_steps": 503808000, "exact_value_avg": 0.31152111291885376, "regret_dist": 0.4922562539577484, "regret_other_env": 0.7614770531654358, "regret_corner": 0.08842497318983078, "regret_row": 0.5744547843933105, "regret_any": 0.7614770531654358, "regret_bot": 0.790969729423523, "value_dist": 0.31152111291885376, "value_other_env": 0.06807597726583481, "value_corner": 0.6766887307167053, "value_row": 0.22223424911499023, "value_any": 0.06807597726583481, "value_bot": 0.005719262175261974, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00820.png", "entropy": 0.6905915141105652} +{"ts": "2026-01-29T21:42:14.810329Z", "loop": 825, "env_steps": 506880000, "exact_value_avg": 0.3123970031738281, "regret_dist": 0.49138039350509644, "regret_other_env": 0.7614051103591919, "regret_corner": 0.08634329587221146, "regret_row": 0.5810319185256958, "regret_any": 0.7614051103591919, "regret_bot": 0.7905679941177368, "value_dist": 0.3123970031738281, "value_other_env": 0.06814803183078766, "value_corner": 0.6787704825401306, "value_row": 0.21565714478492737, "value_any": 0.06814803183078766, "value_bot": 0.006121096201241016, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00825.png", "entropy": 0.693221926689148} +{"ts": "2026-01-29T21:42:20.655304Z", "loop": 830, "env_steps": 509952000, "exact_value_avg": 0.3113969564437866, "regret_dist": 0.49238044023513794, "regret_other_env": 0.76144939661026, "regret_corner": 0.08877692371606827, "regret_row": 0.604039192199707, "regret_any": 0.76144939661026, "regret_bot": 0.7889647483825684, "value_dist": 0.3113969564437866, "value_other_env": 0.06810370087623596, "value_corner": 0.6763368248939514, "value_row": 0.19264988601207733, "value_any": 0.06810370087623596, "value_bot": 0.0077243284322321415, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00830.png", "entropy": 0.6900179982185364} +{"ts": "2026-01-29T21:42:26.507704Z", "loop": 835, "env_steps": 513024000, "exact_value_avg": 0.31288477778434753, "regret_dist": 0.49089258909225464, "regret_other_env": 0.7614099383354187, "regret_corner": 0.08511658757925034, "regret_row": 0.5894794464111328, "regret_any": 0.7614099383354187, "regret_bot": 0.7900336980819702, "value_dist": 0.31288477778434753, "value_other_env": 0.06814320385456085, "value_corner": 0.6799971461296082, "value_row": 0.20720963180065155, "value_any": 0.06814320385456085, "value_bot": 0.006655458826571703, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00835.png", "entropy": 0.6941538453102112} +{"ts": "2026-01-29T21:42:32.354658Z", "loop": 840, "env_steps": 516096000, "exact_value_avg": 0.3122991621494293, "regret_dist": 0.49147820472717285, "regret_other_env": 0.7614653706550598, "regret_corner": 0.0864974707365036, "regret_row": 0.577559769153595, "regret_any": 0.7614653706550598, "regret_bot": 0.7908044457435608, "value_dist": 0.3122991621494293, "value_other_env": 0.06808776408433914, "value_corner": 0.6786162257194519, "value_row": 0.2191292941570282, "value_any": 0.06808776408433914, "value_bot": 0.005884577054530382, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00840.png", "entropy": 0.691727876663208} +{"ts": "2026-01-29T21:42:38.198062Z", "loop": 845, "env_steps": 519168000, "exact_value_avg": 0.3129971921443939, "regret_dist": 0.49078017473220825, "regret_other_env": 0.7614476084709167, "regret_corner": 0.08477894961833954, "regret_row": 0.5942627191543579, "regret_any": 0.7614476084709167, "regret_bot": 0.789732038974762, "value_dist": 0.3129971921443939, "value_other_env": 0.06810545921325684, "value_corner": 0.680334746837616, "value_row": 0.20242634415626526, "value_any": 0.06810545921325684, "value_bot": 0.006957057397812605, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00845.png", "entropy": 0.6935309767723083} +{"ts": "2026-01-29T21:42:44.043835Z", "loop": 850, "env_steps": 522240000, "exact_value_avg": 0.3120160400867462, "regret_dist": 0.49176132678985596, "regret_other_env": 0.761551558971405, "regret_corner": 0.08707593381404877, "regret_row": 0.6052401065826416, "regret_any": 0.761551558971405, "regret_bot": 0.7889556884765625, "value_dist": 0.3120160400867462, "value_other_env": 0.06800153851509094, "value_corner": 0.6780377626419067, "value_row": 0.19144892692565918, "value_any": 0.06800153851509094, "value_bot": 0.007733447477221489, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00850.png", "entropy": 0.6891919374465942} +{"ts": "2026-01-29T21:42:49.885296Z", "loop": 855, "env_steps": 525312000, "exact_value_avg": 0.3121451735496521, "regret_dist": 0.4916321933269501, "regret_other_env": 0.7615147233009338, "regret_corner": 0.08680838346481323, "regret_row": 0.5743606686592102, "regret_any": 0.7615147233009338, "regret_bot": 0.7910183668136597, "value_dist": 0.3121451735496521, "value_other_env": 0.06803837418556213, "value_corner": 0.6783053278923035, "value_row": 0.22232836484909058, "value_any": 0.06803837418556213, "value_bot": 0.005670706741511822, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00855.png", "entropy": 0.6898850202560425} +{"ts": "2026-01-29T21:42:55.728071Z", "loop": 860, "env_steps": 528384000, "exact_value_avg": 0.3133881092071533, "regret_dist": 0.49038925766944885, "regret_other_env": 0.7614357471466064, "regret_corner": 0.08381947129964828, "regret_row": 0.5943363904953003, "regret_any": 0.7614357471466064, "regret_bot": 0.7897577881813049, "value_dist": 0.3133881092071533, "value_other_env": 0.06811732053756714, "value_corner": 0.6812942624092102, "value_row": 0.20235267281532288, "value_any": 0.06811732053756714, "value_bot": 0.006931268610060215, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00860.png", "entropy": 0.6935827732086182} +{"ts": "2026-01-29T21:43:01.577478Z", "loop": 865, "env_steps": 531456000, "exact_value_avg": 0.3130682110786438, "regret_dist": 0.490709125995636, "regret_other_env": 0.7614960074424744, "regret_corner": 0.08452876657247543, "regret_row": 0.60068678855896, "regret_any": 0.7614960074424744, "regret_bot": 0.789333164691925, "value_dist": 0.3130682110786438, "value_other_env": 0.06805702298879623, "value_corner": 0.6805849671363831, "value_row": 0.19600218534469604, "value_any": 0.06805702298879623, "value_bot": 0.007355905137956142, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00865.png", "entropy": 0.6917896270751953} +{"ts": "2026-01-29T21:43:07.429028Z", "loop": 870, "env_steps": 534528000, "exact_value_avg": 0.3137659430503845, "regret_dist": 0.4900114834308624, "regret_other_env": 0.7614613175392151, "regret_corner": 0.08283668756484985, "regret_row": 0.5870621800422668, "regret_any": 0.7614613175392151, "regret_bot": 0.7902789115905762, "value_dist": 0.3137659430503845, "value_other_env": 0.06809182465076447, "value_corner": 0.6822770833969116, "value_row": 0.20962685346603394, "value_any": 0.06809182465076447, "value_bot": 0.0064101433381438255, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00870.png", "entropy": 0.6938584446907043} +{"ts": "2026-01-29T21:43:13.281799Z", "loop": 875, "env_steps": 537600000, "exact_value_avg": 0.31405022740364075, "regret_dist": 0.4897271692752838, "regret_other_env": 0.7614595890045166, "regret_corner": 0.08212852478027344, "regret_row": 0.5908048152923584, "regret_any": 0.7614595890045166, "regret_bot": 0.7900518774986267, "value_dist": 0.31405022740364075, "value_other_env": 0.06809357553720474, "value_corner": 0.6829851865768433, "value_row": 0.20588429272174835, "value_any": 0.06809357553720474, "value_bot": 0.006637197453528643, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00875.png", "entropy": 0.6937865018844604} +{"ts": "2026-01-29T21:43:19.131240Z", "loop": 880, "env_steps": 540672000, "exact_value_avg": 0.31432026624679565, "regret_dist": 0.4894571006298065, "regret_other_env": 0.7614617347717285, "regret_corner": 0.08145014941692352, "regret_row": 0.5900310277938843, "regret_any": 0.7614617347717285, "regret_bot": 0.7901206016540527, "value_dist": 0.31432026624679565, "value_other_env": 0.06809135526418686, "value_corner": 0.6836636066436768, "value_row": 0.2066580057144165, "value_any": 0.06809135526418686, "value_bot": 0.00656842952594161, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00880.png", "entropy": 0.693597674369812} +{"ts": "2026-01-29T21:43:24.979284Z", "loop": 885, "env_steps": 543744000, "exact_value_avg": 0.31447452306747437, "regret_dist": 0.4893028736114502, "regret_other_env": 0.7614715695381165, "regret_corner": 0.0810498371720314, "regret_row": 0.5861754417419434, "regret_any": 0.7614715695381165, "regret_bot": 0.7903890609741211, "value_dist": 0.31447452306747437, "value_other_env": 0.0680815577507019, "value_corner": 0.6840639114379883, "value_row": 0.21051357686519623, "value_any": 0.0680815577507019, "value_bot": 0.006299987435340881, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00885.png", "entropy": 0.6930688619613647} +{"ts": "2026-01-29T21:43:30.826322Z", "loop": 890, "env_steps": 546816000, "exact_value_avg": 0.3143051564693451, "regret_dist": 0.4894722104072571, "regret_other_env": 0.7614879608154297, "regret_corner": 0.08144855499267578, "regret_row": 0.6033744215965271, "regret_any": 0.7614879608154297, "regret_bot": 0.789247453212738, "value_dist": 0.3143051564693451, "value_other_env": 0.06806513667106628, "value_corner": 0.6836651563644409, "value_row": 0.19331462681293488, "value_any": 0.06806513667106628, "value_bot": 0.007441602647304535, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00890.png", "entropy": 0.6901592016220093} +{"ts": "2026-01-29T21:43:36.674325Z", "loop": 895, "env_steps": 549888000, "exact_value_avg": 0.3153567910194397, "regret_dist": 0.4884205758571625, "regret_other_env": 0.7614876627922058, "regret_corner": 0.07881991565227509, "regret_row": 0.5914506316184998, "regret_any": 0.7614876627922058, "regret_bot": 0.7901309728622437, "value_dist": 0.3153567910194397, "value_other_env": 0.06806540489196777, "value_corner": 0.6862938404083252, "value_row": 0.2052384316921234, "value_any": 0.06806540489196777, "value_bot": 0.006558124907314777, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00895.png", "entropy": 0.6926689743995667} +{"ts": "2026-01-29T21:43:42.516611Z", "loop": 900, "env_steps": 552960000, "exact_value_avg": 0.31569892168045044, "regret_dist": 0.4880785048007965, "regret_other_env": 0.7614717483520508, "regret_corner": 0.07798855006694794, "regret_row": 0.5890175104141235, "regret_any": 0.7614717483520508, "regret_bot": 0.7903184294700623, "value_dist": 0.31569892168045044, "value_other_env": 0.06808135658502579, "value_corner": 0.6871252059936523, "value_row": 0.20767150819301605, "value_any": 0.06808135658502579, "value_bot": 0.006370676215738058, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00900.png", "entropy": 0.6922534108161926} +{"ts": "2026-01-29T21:43:48.356381Z", "loop": 905, "env_steps": 556032000, "exact_value_avg": 0.31521886587142944, "regret_dist": 0.48855847120285034, "regret_other_env": 0.7614582777023315, "regret_corner": 0.07920869439840317, "regret_row": 0.6078298687934875, "regret_any": 0.7614582777023315, "regret_bot": 0.7890280485153198, "value_dist": 0.31521886587142944, "value_other_env": 0.06809478998184204, "value_corner": 0.6859049797058105, "value_row": 0.18885920941829681, "value_any": 0.06809478998184204, "value_bot": 0.007660993374884129, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00905.png", "entropy": 0.6874856352806091} +{"ts": "2026-01-29T21:43:54.203306Z", "loop": 910, "env_steps": 559104000, "exact_value_avg": 0.31672653555870056, "regret_dist": 0.4870508313179016, "regret_other_env": 0.7614210844039917, "regret_corner": 0.07549542188644409, "regret_row": 0.5908096432685852, "regret_any": 0.7614210844039917, "regret_bot": 0.7902582287788391, "value_dist": 0.31672653555870056, "value_other_env": 0.06813202798366547, "value_corner": 0.6896182894706726, "value_row": 0.2058793604373932, "value_any": 0.06813202798366547, "value_bot": 0.0064308252185583115, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00910.png", "entropy": 0.6915876269340515} +{"ts": "2026-01-29T21:44:00.045541Z", "loop": 915, "env_steps": 562176000, "exact_value_avg": 0.31739428639411926, "regret_dist": 0.4863830804824829, "regret_other_env": 0.7613500356674194, "regret_corner": 0.07393262535333633, "regret_row": 0.5990148186683655, "regret_any": 0.7613500356674194, "regret_bot": 0.7897418141365051, "value_dist": 0.31739428639411926, "value_other_env": 0.06820309162139893, "value_corner": 0.6911810636520386, "value_row": 0.1976742148399353, "value_any": 0.06820309162139893, "value_bot": 0.006947244051843882, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00915.png", "entropy": 0.6904400587081909} +{"ts": "2026-01-29T21:44:05.887331Z", "loop": 920, "env_steps": 565248000, "exact_value_avg": 0.31816136837005615, "regret_dist": 0.4856160283088684, "regret_other_env": 0.7613556385040283, "regret_corner": 0.07200659811496735, "regret_row": 0.5923306345939636, "regret_any": 0.7613556385040283, "regret_bot": 0.7902524471282959, "value_dist": 0.31816136837005615, "value_other_env": 0.06819749623537064, "value_corner": 0.6931071281433105, "value_row": 0.20435845851898193, "value_any": 0.06819749623537064, "value_bot": 0.006436697207391262, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00920.png", "entropy": 0.6902628540992737} +{"ts": "2026-01-29T21:44:11.731949Z", "loop": 925, "env_steps": 568320000, "exact_value_avg": 0.3191163241863251, "regret_dist": 0.4846610724925995, "regret_other_env": 0.7612918615341187, "regret_corner": 0.06971486657857895, "regret_row": 0.6044113636016846, "regret_any": 0.7612918615341187, "regret_bot": 0.7895023226737976, "value_dist": 0.3191163241863251, "value_other_env": 0.06826125830411911, "value_corner": 0.6953988671302795, "value_row": 0.192277729511261, "value_any": 0.06826125830411911, "value_bot": 0.007186722010374069, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00925.png", "entropy": 0.6873332262039185} +{"ts": "2026-01-29T21:44:17.584906Z", "loop": 930, "env_steps": 571392000, "exact_value_avg": 0.31946176290512085, "regret_dist": 0.4843156337738037, "regret_other_env": 0.7613961100578308, "regret_corner": 0.06869489699602127, "regret_row": 0.584560751914978, "regret_any": 0.7613961100578308, "regret_bot": 0.7909125685691833, "value_dist": 0.31946176290512085, "value_other_env": 0.06815700232982635, "value_corner": 0.6964188814163208, "value_row": 0.21212829649448395, "value_any": 0.06815700232982635, "value_bot": 0.005776525940746069, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00930.png", "entropy": 0.6849147081375122} +{"ts": "2026-01-29T21:44:23.436100Z", "loop": 935, "env_steps": 574464000, "exact_value_avg": 0.32117754220962524, "regret_dist": 0.4825998842716217, "regret_other_env": 0.7611755728721619, "regret_corner": 0.06473628431558609, "regret_row": 0.6150416135787964, "regret_any": 0.7611755728721619, "regret_bot": 0.7889418601989746, "value_dist": 0.32117754220962524, "value_other_env": 0.06837758421897888, "value_corner": 0.7003774642944336, "value_row": 0.1816474348306656, "value_any": 0.06837758421897888, "value_bot": 0.007747143507003784, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00935.png", "entropy": 0.6795226335525513} +{"ts": "2026-01-29T21:44:29.278807Z", "loop": 940, "env_steps": 577536000, "exact_value_avg": 0.32284054160118103, "regret_dist": 0.48093682527542114, "regret_other_env": 0.761258602142334, "regret_corner": 0.060454100370407104, "regret_row": 0.5925343632698059, "regret_any": 0.761258602142334, "regret_bot": 0.7906719446182251, "value_dist": 0.32284054160118103, "value_other_env": 0.06829444319009781, "value_corner": 0.704659640789032, "value_row": 0.20415472984313965, "value_any": 0.06829444319009781, "value_bot": 0.006017112638801336, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00940.png", "entropy": 0.6803978681564331} +{"ts": "2026-01-29T21:44:35.121929Z", "loop": 945, "env_steps": 580608000, "exact_value_avg": 0.3252488970756531, "regret_dist": 0.4785284698009491, "regret_other_env": 0.7610266804695129, "regret_corner": 0.054781120270490646, "regret_row": 0.6190049648284912, "regret_any": 0.7610266804695129, "regret_bot": 0.7890086770057678, "value_dist": 0.3252488970756531, "value_other_env": 0.06852640956640244, "value_corner": 0.7103326320648193, "value_row": 0.1776840090751648, "value_any": 0.06852640956640244, "value_bot": 0.0076804086565971375, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00945.png", "entropy": 0.66965252161026} +{"ts": "2026-01-29T21:44:40.964363Z", "loop": 950, "env_steps": 583680000, "exact_value_avg": 0.32760506868362427, "regret_dist": 0.4761722683906555, "regret_other_env": 0.7609201669692993, "regret_corner": 0.04905041307210922, "regret_row": 0.6131131649017334, "regret_any": 0.7609201669692993, "regret_bot": 0.789659321308136, "value_dist": 0.32760506868362427, "value_other_env": 0.06863292306661606, "value_corner": 0.7160632610321045, "value_row": 0.18357591331005096, "value_any": 0.06863292306661606, "value_bot": 0.007029709406197071, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00950.png", "entropy": 0.6662675738334656} +{"ts": "2026-01-29T21:44:46.803241Z", "loop": 955, "env_steps": 586752000, "exact_value_avg": 0.3296034038066864, "regret_dist": 0.47417399287223816, "regret_other_env": 0.7607119083404541, "regret_corner": 0.04436710849404335, "regret_row": 0.6110268235206604, "regret_any": 0.7607119083404541, "regret_bot": 0.789997398853302, "value_dist": 0.3296034038066864, "value_other_env": 0.06884123384952545, "value_corner": 0.720746636390686, "value_row": 0.18566222488880157, "value_any": 0.06884123384952545, "value_bot": 0.006691631395369768, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00955.png", "entropy": 0.6580180525779724} +{"ts": "2026-01-29T21:44:52.656174Z", "loop": 960, "env_steps": 589824000, "exact_value_avg": 0.3316929042339325, "regret_dist": 0.4720844328403473, "regret_other_env": 0.7601915597915649, "regret_corner": 0.03992372378706932, "regret_row": 0.6323534846305847, "regret_any": 0.7601915597915649, "regret_bot": 0.7884935736656189, "value_dist": 0.3316929042339325, "value_other_env": 0.06936150789260864, "value_corner": 0.7251899838447571, "value_row": 0.16433559358119965, "value_any": 0.06936150789260864, "value_bot": 0.008195549249649048, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00960.png", "entropy": 0.6373922228813171} +{"ts": "2026-01-29T21:44:58.499070Z", "loop": 965, "env_steps": 592896000, "exact_value_avg": 0.32978031039237976, "regret_dist": 0.4739970564842224, "regret_other_env": 0.7603581547737122, "regret_corner": 0.04445541650056839, "regret_row": 0.5938858985900879, "regret_any": 0.7603581547737122, "regret_bot": 0.7914581298828125, "value_dist": 0.32978031039237976, "value_other_env": 0.06919494271278381, "value_corner": 0.7206583619117737, "value_row": 0.2028031200170517, "value_any": 0.06919494271278381, "value_bot": 0.005230939015746117, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00965.png", "entropy": 0.6279696226119995} +{"ts": "2026-01-29T21:45:04.343029Z", "loop": 970, "env_steps": 595968000, "exact_value_avg": 0.3288671374320984, "regret_dist": 0.47491025924682617, "regret_other_env": 0.7593058943748474, "regret_corner": 0.04831681400537491, "regret_row": 0.6674338579177856, "regret_any": 0.7593058943748474, "regret_bot": 0.7841998338699341, "value_dist": 0.3288671374320984, "value_other_env": 0.07024723291397095, "value_corner": 0.7167969346046448, "value_row": 0.12925520539283752, "value_any": 0.07024723291397095, "value_bot": 0.012489231303334236, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00970.png", "entropy": 0.539275586605072} +{"ts": "2026-01-29T21:45:10.185273Z", "loop": 975, "env_steps": 599040000, "exact_value_avg": 0.33615440130233765, "regret_dist": 0.4676229655742645, "regret_other_env": 0.7588648200035095, "regret_corner": 0.03076016530394554, "regret_row": 0.6112626791000366, "regret_any": 0.7588648200035095, "regret_bot": 0.7905780076980591, "value_dist": 0.33615440130233765, "value_other_env": 0.07068827748298645, "value_corner": 0.7343535423278809, "value_row": 0.18542636930942535, "value_any": 0.07068827748298645, "value_bot": 0.006111053749918938, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00975.png", "entropy": 0.5868059992790222} +{"ts": "2026-01-29T21:45:16.032308Z", "loop": 980, "env_steps": 602112000, "exact_value_avg": 0.3377986550331116, "regret_dist": 0.4659787118434906, "regret_other_env": 0.7574116587638855, "regret_corner": 0.02882930263876915, "regret_row": 0.6640323400497437, "regret_any": 0.7574116587638855, "regret_bot": 0.7845997214317322, "value_dist": 0.3377986550331116, "value_other_env": 0.07214144617319107, "value_corner": 0.7362844347953796, "value_row": 0.13265672326087952, "value_any": 0.07214144617319107, "value_bot": 0.012089363299310207, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00980.png", "entropy": 0.513243556022644} +{"ts": "2026-01-29T21:45:21.878718Z", "loop": 985, "env_steps": 605184000, "exact_value_avg": 0.3411160707473755, "regret_dist": 0.4626612961292267, "regret_other_env": 0.7567858099937439, "regret_corner": 0.02147451788187027, "regret_row": 0.625855565071106, "regret_any": 0.7567858099937439, "regret_bot": 0.7892078757286072, "value_dist": 0.3411160707473755, "value_other_env": 0.07276729494333267, "value_corner": 0.7436392307281494, "value_row": 0.1708335280418396, "value_any": 0.07276729494333267, "value_bot": 0.007481222040951252, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00985.png", "entropy": 0.5343257784843445} +{"ts": "2026-01-29T21:45:27.732092Z", "loop": 990, "env_steps": 608256000, "exact_value_avg": 0.3441777229309082, "regret_dist": 0.45959967374801636, "regret_other_env": 0.7551447153091431, "regret_corner": 0.01628207415342331, "regret_row": 0.6424094438552856, "regret_any": 0.7551447153091431, "regret_bot": 0.7870101928710938, "value_dist": 0.3441777229309082, "value_other_env": 0.0744083970785141, "value_corner": 0.7488316893577576, "value_row": 0.15427955985069275, "value_any": 0.0744083970785141, "value_bot": 0.009678827598690987, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00990.png", "entropy": 0.4898724853992462} +{"ts": "2026-01-29T21:45:33.579748Z", "loop": 995, "env_steps": 611328000, "exact_value_avg": 0.3454020023345947, "regret_dist": 0.45837539434432983, "regret_other_env": 0.7534828186035156, "regret_corner": 0.01571422442793846, "regret_row": 0.6621902585029602, "regret_any": 0.7534828186035156, "regret_bot": 0.7833909392356873, "value_dist": 0.3454020023345947, "value_other_env": 0.07607028633356094, "value_corner": 0.7493995428085327, "value_row": 0.13449878990650177, "value_any": 0.07607028633356094, "value_bot": 0.013298100791871548, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_00995.png", "entropy": 0.4306647479534149} +{"ts": "2026-01-29T21:45:39.424226Z", "loop": 1000, "env_steps": 614400000, "exact_value_avg": 0.34723588824272156, "regret_dist": 0.4565415382385254, "regret_other_env": 0.7522892951965332, "regret_corner": 0.01291980966925621, "regret_row": 0.6369480490684509, "regret_any": 0.7522892951965332, "regret_bot": 0.7864640355110168, "value_dist": 0.34723588824272156, "value_other_env": 0.07726384699344635, "value_corner": 0.7521939277648926, "value_row": 0.15974101424217224, "value_any": 0.07726384699344635, "value_bot": 0.010224931873381138, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01000.png", "entropy": 0.4388256072998047} +{"ts": "2026-01-29T21:45:45.270187Z", "loop": 1005, "env_steps": 617472000, "exact_value_avg": 0.347822904586792, "regret_dist": 0.45595449209213257, "regret_other_env": 0.7509522438049316, "regret_corner": 0.013457849621772766, "regret_row": 0.6251344084739685, "regret_any": 0.7509522438049316, "regret_bot": 0.7871195077896118, "value_dist": 0.347822904586792, "value_other_env": 0.07860086858272552, "value_corner": 0.7516558766365051, "value_row": 0.17155463993549347, "value_any": 0.07860086858272552, "value_bot": 0.009569439105689526, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01005.png", "entropy": 0.42010754346847534} +{"ts": "2026-01-29T21:45:51.119984Z", "loop": 1010, "env_steps": 620544000, "exact_value_avg": 0.3454344868659973, "regret_dist": 0.45834288001060486, "regret_other_env": 0.7493999600410461, "regret_corner": 0.021757209673523903, "regret_row": 0.6806691288948059, "regret_any": 0.7493999600410461, "regret_bot": 0.7758693695068359, "value_dist": 0.3454344868659973, "value_other_env": 0.08015315234661102, "value_corner": 0.743356466293335, "value_row": 0.11601994186639786, "value_any": 0.08015315234661102, "value_bot": 0.020819665864109993, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01010.png", "entropy": 0.32892534136772156} +{"ts": "2026-01-29T21:45:56.969640Z", "loop": 1015, "env_steps": 623616000, "exact_value_avg": 0.34443315863609314, "regret_dist": 0.4593442678451538, "regret_other_env": 0.7497420907020569, "regret_corner": 0.02374747395515442, "regret_row": 0.5896400213241577, "regret_any": 0.7497420907020569, "regret_bot": 0.7897486686706543, "value_dist": 0.34443315863609314, "value_other_env": 0.07981101423501968, "value_corner": 0.7413663268089294, "value_row": 0.20704904198646545, "value_any": 0.07981101423501968, "value_bot": 0.006940396502614021, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01015.png", "entropy": 0.3915739357471466} +{"ts": "2026-01-29T21:46:02.817357Z", "loop": 1020, "env_steps": 626688000, "exact_value_avg": 0.35292917490005493, "regret_dist": 0.45084819197654724, "regret_other_env": 0.7444397807121277, "regret_corner": 0.010460744611918926, "regret_row": 0.6701896786689758, "regret_any": 0.7444397807121277, "regret_bot": 0.77657550573349, "value_dist": 0.35292917490005493, "value_other_env": 0.08511330187320709, "value_corner": 0.7546529769897461, "value_row": 0.12649932503700256, "value_any": 0.08511330187320709, "value_bot": 0.02011353150010109, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01020.png", "entropy": 0.3104488253593445} +{"ts": "2026-01-29T21:46:08.661111Z", "loop": 1025, "env_steps": 629760000, "exact_value_avg": 0.35441869497299194, "regret_dist": 0.4493587017059326, "regret_other_env": 0.7434331178665161, "regret_corner": 0.008247047662734985, "regret_row": 0.617396891117096, "regret_any": 0.7434331178665161, "regret_bot": 0.7846845984458923, "value_dist": 0.35441869497299194, "value_other_env": 0.08612003177404404, "value_corner": 0.7568666934967041, "value_row": 0.17929211258888245, "value_any": 0.08612003177404404, "value_bot": 0.01200437918305397, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01025.png", "entropy": 0.320970356464386} +{"ts": "2026-01-29T21:46:14.522026Z", "loop": 1030, "env_steps": 632832000, "exact_value_avg": 0.35770922899246216, "regret_dist": 0.4460681676864624, "regret_other_env": 0.7395053505897522, "regret_corner": 0.00591230159625411, "regret_row": 0.6615312099456787, "regret_any": 0.7395053505897522, "regret_bot": 0.7751421332359314, "value_dist": 0.35770922899246216, "value_other_env": 0.09004772454500198, "value_corner": 0.7592014670372009, "value_row": 0.13515783846378326, "value_any": 0.09004772454500198, "value_bot": 0.02154696173965931, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01030.png", "entropy": 0.2714148163795471} +{"ts": "2026-01-29T21:46:20.370182Z", "loop": 1035, "env_steps": 635904000, "exact_value_avg": 0.35924309492111206, "regret_dist": 0.4445343315601349, "regret_other_env": 0.7374316453933716, "regret_corner": 0.00518830306828022, "regret_row": 0.6607203483581543, "regret_any": 0.7374316453933716, "regret_bot": 0.7742682695388794, "value_dist": 0.35924309492111206, "value_other_env": 0.09212150424718857, "value_corner": 0.7599254250526428, "value_row": 0.13596874475479126, "value_any": 0.09212150424718857, "value_bot": 0.022420821711421013, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01035.png", "entropy": 0.2593269348144531} +{"ts": "2026-01-29T21:46:26.218069Z", "loop": 1040, "env_steps": 638976000, "exact_value_avg": 0.3541161119937897, "regret_dist": 0.4496612548828125, "regret_other_env": 0.7403725981712341, "regret_corner": 0.013594157062470913, "regret_row": 0.5831127762794495, "regret_any": 0.7403725981712341, "regret_bot": 0.7867225408554077, "value_dist": 0.3541161119937897, "value_other_env": 0.08918046206235886, "value_corner": 0.7515195608139038, "value_row": 0.21357624232769012, "value_any": 0.08918046206235886, "value_bot": 0.009966546669602394, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01040.png", "entropy": 0.28203845024108887} +{"ts": "2026-01-29T21:46:32.066754Z", "loop": 1045, "env_steps": 642048000, "exact_value_avg": 0.35332778096199036, "regret_dist": 0.4504495859146118, "regret_other_env": 0.7382873296737671, "regret_corner": 0.018692903220653534, "regret_row": 0.6868754029273987, "regret_any": 0.7382873296737671, "regret_bot": 0.7655874490737915, "value_dist": 0.35332778096199036, "value_other_env": 0.0912657231092453, "value_corner": 0.7464208602905273, "value_row": 0.10981365293264389, "value_any": 0.0912657231092453, "value_bot": 0.031101621687412262, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01045.png", "entropy": 0.20510534942150116} +{"ts": "2026-01-29T21:46:37.922482Z", "loop": 1050, "env_steps": 645120000, "exact_value_avg": 0.36378034949302673, "regret_dist": 0.4399970471858978, "regret_other_env": 0.7316277623176575, "regret_corner": 0.0025509516708552837, "regret_row": 0.6250061392784119, "regret_any": 0.7316277623176575, "regret_bot": 0.7775651216506958, "value_dist": 0.36378034949302673, "value_other_env": 0.09792537987232208, "value_corner": 0.7625628113746643, "value_row": 0.17168289422988892, "value_any": 0.09792537987232208, "value_bot": 0.019123902544379234, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01050.png", "entropy": 0.2265980839729309} +{"ts": "2026-01-29T21:46:43.779204Z", "loop": 1055, "env_steps": 648192000, "exact_value_avg": 0.36380624771118164, "regret_dist": 0.43997108936309814, "regret_other_env": 0.7309914827346802, "regret_corner": 0.0034404434263706207, "regret_row": 0.6083471179008484, "regret_any": 0.7309914827346802, "regret_bot": 0.7798819541931152, "value_dist": 0.36380624771118164, "value_other_env": 0.09856155514717102, "value_corner": 0.7616732716560364, "value_row": 0.1883419156074524, "value_any": 0.09856155514717102, "value_bot": 0.01680714823305607, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01055.png", "entropy": 0.21853968501091003} +{"ts": "2026-01-29T21:46:49.632814Z", "loop": 1060, "env_steps": 651264000, "exact_value_avg": 0.35708603262901306, "regret_dist": 0.4466913640499115, "regret_other_env": 0.7337368726730347, "regret_corner": 0.016123026609420776, "regret_row": 0.688254714012146, "regret_any": 0.7337368726730347, "regret_bot": 0.7636255621910095, "value_dist": 0.35708603262901306, "value_other_env": 0.0958162397146225, "value_corner": 0.7489907145500183, "value_row": 0.10843440890312195, "value_any": 0.0958162397146225, "value_bot": 0.03306347876787186, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01060.png", "entropy": 0.17247644066810608} +{"ts": "2026-01-29T21:46:55.478130Z", "loop": 1065, "env_steps": 654336000, "exact_value_avg": 0.36783018708229065, "regret_dist": 0.4359471797943115, "regret_other_env": 0.7251457571983337, "regret_corner": 0.002149272011592984, "regret_row": 0.6568424701690674, "regret_any": 0.7251457571983337, "regret_bot": 0.768916666507721, "value_dist": 0.36783018708229065, "value_other_env": 0.10440730303525925, "value_corner": 0.7629644870758057, "value_row": 0.1398465931415558, "value_any": 0.10440730303525925, "value_bot": 0.02777235023677349, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01065.png", "entropy": 0.17518293857574463} +{"ts": "2026-01-29T21:47:01.336529Z", "loop": 1070, "env_steps": 657408000, "exact_value_avg": 0.36766791343688965, "regret_dist": 0.4361094832420349, "regret_other_env": 0.7253918647766113, "regret_corner": 0.0021858231630176306, "regret_row": 0.6048762202262878, "regret_any": 0.7253918647766113, "regret_bot": 0.7781373858451843, "value_dist": 0.36766791343688965, "value_other_env": 0.10416122525930405, "value_corner": 0.7629279494285583, "value_row": 0.19181281328201294, "value_any": 0.10416122525930405, "value_bot": 0.018551692366600037, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01070.png", "entropy": 0.17462198436260223} +{"ts": "2026-01-29T21:47:07.193025Z", "loop": 1075, "env_steps": 660480000, "exact_value_avg": 0.3693169951438904, "regret_dist": 0.4344603717327118, "regret_other_env": 0.722888171672821, "regret_corner": 0.0018186371307820082, "regret_row": 0.6020206212997437, "regret_any": 0.722888171672821, "regret_bot": 0.777346134185791, "value_dist": 0.3693169951438904, "value_other_env": 0.10666487365961075, "value_corner": 0.7632951140403748, "value_row": 0.19466842710971832, "value_any": 0.10666487365961075, "value_bot": 0.01934293657541275, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01075.png", "entropy": 0.16378597915172577} +{"ts": "2026-01-29T21:47:13.046407Z", "loop": 1080, "env_steps": 663552000, "exact_value_avg": 0.37227684259414673, "regret_dist": 0.43150052428245544, "regret_other_env": 0.718413770198822, "regret_corner": 0.0011306321248412132, "regret_row": 0.6494959592819214, "regret_any": 0.718413770198822, "regret_bot": 0.7665925025939941, "value_dist": 0.37227684259414673, "value_other_env": 0.11113931983709335, "value_corner": 0.7639831304550171, "value_row": 0.147193044424057, "value_any": 0.11113931983709335, "value_bot": 0.030096594244241714, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01080.png", "entropy": 0.14544491469860077} +{"ts": "2026-01-29T21:47:18.903198Z", "loop": 1085, "env_steps": 666624000, "exact_value_avg": 0.36661583185195923, "regret_dist": 0.4371615946292877, "regret_other_env": 0.7231757044792175, "regret_corner": 0.008140357211232185, "regret_row": 0.6822260618209839, "regret_any": 0.7231757044792175, "regret_bot": 0.7611579895019531, "value_dist": 0.36661583185195923, "value_other_env": 0.10637741535902023, "value_corner": 0.7569734454154968, "value_row": 0.1144629567861557, "value_any": 0.10637741535902023, "value_bot": 0.035531044006347656, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01085.png", "entropy": 0.1293761283159256} +{"ts": "2026-01-29T21:47:24.752572Z", "loop": 1090, "env_steps": 669696000, "exact_value_avg": 0.3740557134151459, "regret_dist": 0.4297216832637787, "regret_other_env": 0.715431809425354, "regret_corner": 0.0011564906453713775, "regret_row": 0.6538028717041016, "regret_any": 0.715431809425354, "regret_bot": 0.7643170952796936, "value_dist": 0.3740557134151459, "value_other_env": 0.11412132531404495, "value_corner": 0.7639572620391846, "value_row": 0.1428861916065216, "value_any": 0.11412132531404495, "value_bot": 0.03237197548151016, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01090.png", "entropy": 0.127830371260643} +{"ts": "2026-01-29T21:47:30.606406Z", "loop": 1095, "env_steps": 672768000, "exact_value_avg": 0.3764004707336426, "regret_dist": 0.427376925945282, "regret_other_env": 0.711999237537384, "regret_corner": 0.0004433552676346153, "regret_row": 0.6138641834259033, "regret_any": 0.711999237537384, "regret_bot": 0.7707250118255615, "value_dist": 0.3764004707336426, "value_other_env": 0.11755385994911194, "value_corner": 0.7646703720092773, "value_row": 0.18282485008239746, "value_any": 0.11755385994911194, "value_bot": 0.025964008644223213, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01095.png", "entropy": 0.13030670583248138} +{"ts": "2026-01-29T21:47:36.460157Z", "loop": 1100, "env_steps": 675840000, "exact_value_avg": 0.37802058458328247, "regret_dist": 0.4257567822933197, "regret_other_env": 0.7093545794487, "regret_corner": 0.0003599931951612234, "regret_row": 0.6148480772972107, "regret_any": 0.7093545794487, "regret_bot": 0.7687214016914368, "value_dist": 0.37802058458328247, "value_other_env": 0.12019850313663483, "value_corner": 0.7647537589073181, "value_row": 0.18184100091457367, "value_any": 0.12019850313663483, "value_bot": 0.02796764299273491, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01100.png", "entropy": 0.12499206513166428} +{"ts": "2026-01-29T21:47:42.300717Z", "loop": 1105, "env_steps": 678912000, "exact_value_avg": 0.37512844800949097, "regret_dist": 0.428648978471756, "regret_other_env": 0.7124559283256531, "regret_corner": 0.0029385434463620186, "regret_row": 0.6631210446357727, "regret_any": 0.7124559283256531, "regret_bot": 0.7605629563331604, "value_dist": 0.37512844800949097, "value_other_env": 0.11709725111722946, "value_corner": 0.7621752023696899, "value_row": 0.1335679590702057, "value_any": 0.11709725111722946, "value_bot": 0.03612612560391426, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01105.png", "entropy": 0.11267243325710297} +{"ts": "2026-01-29T21:47:48.140238Z", "loop": 1110, "env_steps": 681984000, "exact_value_avg": 0.3778272867202759, "regret_dist": 0.4259500503540039, "regret_other_env": 0.709018349647522, "regret_corner": 0.00134762329980731, "regret_row": 0.5718932747840881, "regret_any": 0.709018349647522, "regret_bot": 0.774095356464386, "value_dist": 0.3778272867202759, "value_other_env": 0.1205347552895546, "value_corner": 0.7637661099433899, "value_row": 0.22479577362537384, "value_any": 0.1205347552895546, "value_bot": 0.0225936658680439, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01110.png", "entropy": 0.11977872252464294} +{"ts": "2026-01-29T21:47:53.986552Z", "loop": 1115, "env_steps": 685056000, "exact_value_avg": 0.3818233013153076, "regret_dist": 0.42195403575897217, "regret_other_env": 0.7030811905860901, "regret_corner": 0.0002632563409861177, "regret_row": 0.6137887835502625, "regret_any": 0.7030811905860901, "regret_bot": 0.7644173502922058, "value_dist": 0.3818233013153076, "value_other_env": 0.1264718770980835, "value_corner": 0.7648504376411438, "value_row": 0.18290027976036072, "value_any": 0.1264718770980835, "value_bot": 0.03227168694138527, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01115.png", "entropy": 0.10967004299163818} +{"ts": "2026-01-29T21:47:59.842461Z", "loop": 1120, "env_steps": 688128000, "exact_value_avg": 0.3805125951766968, "regret_dist": 0.4232648015022278, "regret_other_env": 0.7043535113334656, "regret_corner": 0.0016316692344844341, "regret_row": 0.6459828019142151, "regret_any": 0.7043535113334656, "regret_bot": 0.7601730823516846, "value_dist": 0.3805125951766968, "value_other_env": 0.12519961595535278, "value_corner": 0.7634820938110352, "value_row": 0.1507062166929245, "value_any": 0.12519961595535278, "value_bot": 0.036516014486551285, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01120.png", "entropy": 0.10525773465633392} +{"ts": "2026-01-29T21:48:05.690980Z", "loop": 1125, "env_steps": 691200000, "exact_value_avg": 0.3818280100822449, "regret_dist": 0.4219494163990021, "regret_other_env": 0.7018311023712158, "regret_corner": 0.0021268557757139206, "regret_row": 0.646362841129303, "regret_any": 0.7018311023712158, "regret_bot": 0.7599084377288818, "value_dist": 0.3818280100822449, "value_other_env": 0.12772203981876373, "value_corner": 0.7629868984222412, "value_row": 0.1503261923789978, "value_any": 0.12772203981876373, "value_bot": 0.03678061068058014, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01125.png", "entropy": 0.1068619042634964} +{"ts": "2026-01-29T21:48:11.546341Z", "loop": 1130, "env_steps": 694272000, "exact_value_avg": 0.38677701354026794, "regret_dist": 0.41700032353401184, "regret_other_env": 0.6948273777961731, "regret_corner": 0.00025975905009545386, "regret_row": 0.5981767177581787, "regret_any": 0.6948273777961731, "regret_bot": 0.7637208104133606, "value_dist": 0.38677701354026794, "value_other_env": 0.13472570478916168, "value_corner": 0.7648539543151855, "value_row": 0.1985122561454773, "value_any": 0.13472570478916168, "value_bot": 0.03296825289726257, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01130.png", "entropy": 0.11418229341506958} +{"ts": "2026-01-29T21:48:17.390456Z", "loop": 1135, "env_steps": 697344000, "exact_value_avg": 0.38815054297447205, "regret_dist": 0.4156268239021301, "regret_other_env": 0.6924306750297546, "regret_corner": 0.0004210154293105006, "regret_row": 0.610941469669342, "regret_any": 0.6924306750297546, "regret_bot": 0.7616288065910339, "value_dist": 0.38815054297447205, "value_other_env": 0.13712242245674133, "value_corner": 0.7646927237510681, "value_row": 0.18574751913547516, "value_any": 0.13712242245674133, "value_bot": 0.035060226917266846, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01135.png", "entropy": 0.11495423316955566} +{"ts": "2026-01-29T21:48:23.231270Z", "loop": 1140, "env_steps": 700416000, "exact_value_avg": 0.39055395126342773, "regret_dist": 0.4132234454154968, "regret_other_env": 0.6884918808937073, "regret_corner": 0.00032072814065031707, "regret_row": 0.5694088935852051, "regret_any": 0.6884918808937073, "regret_bot": 0.765442967414856, "value_dist": 0.39055395126342773, "value_other_env": 0.1410612314939499, "value_corner": 0.7647929787635803, "value_row": 0.2272801697254181, "value_any": 0.1410612314939499, "value_bot": 0.031246067956089973, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01140.png", "entropy": 0.12266241014003754} +{"ts": "2026-01-29T21:48:29.077342Z", "loop": 1145, "env_steps": 703488000, "exact_value_avg": 0.39202529191970825, "regret_dist": 0.4117521643638611, "regret_other_env": 0.6859574317932129, "regret_corner": 0.00044418973266147077, "regret_row": 0.5524275302886963, "regret_any": 0.6859574317932129, "regret_bot": 0.7664790749549866, "value_dist": 0.39202529191970825, "value_other_env": 0.14359575510025024, "value_corner": 0.7646695375442505, "value_row": 0.24426153302192688, "value_any": 0.14359575510025024, "value_bot": 0.03021000325679779, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01145.png", "entropy": 0.12904193997383118} +{"ts": "2026-01-29T21:48:34.922620Z", "loop": 1150, "env_steps": 706560000, "exact_value_avg": 0.3954629898071289, "regret_dist": 0.40831440687179565, "regret_other_env": 0.6801308393478394, "regret_corner": 0.0005897343507967889, "regret_row": 0.5838687419891357, "regret_any": 0.6801308393478394, "regret_bot": 0.7609490156173706, "value_dist": 0.3954629898071289, "value_other_env": 0.1494223028421402, "value_corner": 0.764523983001709, "value_row": 0.21282030642032623, "value_any": 0.1494223028421402, "value_bot": 0.03574003651738167, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01150.png", "entropy": 0.12485421448945999} +{"ts": "2026-01-29T21:48:40.773941Z", "loop": 1155, "env_steps": 709632000, "exact_value_avg": 0.39762333035469055, "regret_dist": 0.406154066324234, "regret_other_env": 0.6763768792152405, "regret_corner": 0.0008198221912607551, "regret_row": 0.5835322141647339, "regret_any": 0.6763768792152405, "regret_bot": 0.760286808013916, "value_dist": 0.39762333035469055, "value_other_env": 0.15317624807357788, "value_corner": 0.7642939686775208, "value_row": 0.2131568342447281, "value_any": 0.15317624807357788, "value_bot": 0.03640223294496536, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01155.png", "entropy": 0.12483060359954834} +{"ts": "2026-01-29T21:48:46.627201Z", "loop": 1160, "env_steps": 712704000, "exact_value_avg": 0.4001181721687317, "regret_dist": 0.40365922451019287, "regret_other_env": 0.6725462675094604, "regret_corner": 0.0003286272403784096, "regret_row": 0.5447531938552856, "regret_any": 0.6725462675094604, "regret_bot": 0.7624202966690063, "value_dist": 0.4001181721687317, "value_other_env": 0.15700684487819672, "value_corner": 0.76478511095047, "value_row": 0.2519358694553375, "value_any": 0.15700684487819672, "value_bot": 0.034268755465745926, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01160.png", "entropy": 0.12909583747386932} +{"ts": "2026-01-29T21:48:52.472220Z", "loop": 1165, "env_steps": 715776000, "exact_value_avg": 0.40283501148223877, "regret_dist": 0.4009423851966858, "regret_other_env": 0.6680217981338501, "regret_corner": 0.00032322161132469773, "regret_row": 0.5415961146354675, "regret_any": 0.6680217981338501, "regret_bot": 0.7616634368896484, "value_dist": 0.40283501148223877, "value_other_env": 0.16153131425380707, "value_corner": 0.7647905349731445, "value_row": 0.25509291887283325, "value_any": 0.16153131425380707, "value_bot": 0.035025689750909805, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01165.png", "entropy": 0.12971358001232147} +{"ts": "2026-01-29T21:48:58.316537Z", "loop": 1170, "env_steps": 718848000, "exact_value_avg": 0.4012329578399658, "regret_dist": 0.40254443883895874, "regret_other_env": 0.6685153245925903, "regret_corner": 0.0035880517680197954, "regret_row": 0.5834647417068481, "regret_any": 0.6685153245925903, "regret_bot": 0.7592902779579163, "value_dist": 0.4012329578399658, "value_other_env": 0.16103780269622803, "value_corner": 0.7615256905555725, "value_row": 0.21322430670261383, "value_any": 0.16103780269622803, "value_bot": 0.03739874064922333, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01170.png", "entropy": 0.12442255020141602} +{"ts": "2026-01-29T21:49:04.154912Z", "loop": 1175, "env_steps": 721920000, "exact_value_avg": 0.4056750237941742, "regret_dist": 0.39810240268707275, "regret_other_env": 0.6631520986557007, "regret_corner": 0.0005278120515868068, "regret_row": 0.5220722556114197, "regret_any": 0.6631520986557007, "regret_bot": 0.7628808617591858, "value_dist": 0.4056750237941742, "value_other_env": 0.16640104353427887, "value_corner": 0.7645859122276306, "value_row": 0.2746168076992035, "value_any": 0.16640104353427887, "value_bot": 0.03380821645259857, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01175.png", "entropy": 0.138429194688797} +{"ts": "2026-01-29T21:49:09.995357Z", "loop": 1180, "env_steps": 724992000, "exact_value_avg": 0.4069691598415375, "regret_dist": 0.3968082070350647, "regret_other_env": 0.659285843372345, "regret_corner": 0.0030916801188141108, "regret_row": 0.5611502528190613, "regret_any": 0.659285843372345, "regret_bot": 0.7593525648117065, "value_dist": 0.4069691598415375, "value_other_env": 0.17026720941066742, "value_corner": 0.762022078037262, "value_row": 0.2355387806892395, "value_any": 0.17026720941066742, "value_bot": 0.037336524575948715, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01180.png", "entropy": 0.13093531131744385} +{"ts": "2026-01-29T21:49:15.836780Z", "loop": 1185, "env_steps": 728064000, "exact_value_avg": 0.41403037309646606, "regret_dist": 0.3897469639778137, "regret_other_env": 0.6493311524391174, "regret_corner": 0.0003706991847138852, "regret_row": 0.5364789366722107, "regret_any": 0.6493311524391174, "regret_bot": 0.7602945566177368, "value_dist": 0.41403037309646606, "value_other_env": 0.18022193014621735, "value_corner": 0.7647430300712585, "value_row": 0.2602101266384125, "value_any": 0.18022193014621735, "value_bot": 0.03639442101120949, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01185.png", "entropy": 0.1404143124818802} +{"ts": "2026-01-29T21:49:21.678911Z", "loop": 1190, "env_steps": 731136000, "exact_value_avg": 0.39505499601364136, "regret_dist": 0.4087224304676056, "regret_other_env": 0.6781810522079468, "regret_corner": 0.004534433595836163, "regret_row": 0.4646720886230469, "regret_any": 0.6781810522079468, "regret_bot": 0.7733643054962158, "value_dist": 0.39505499601364136, "value_other_env": 0.15137207508087158, "value_corner": 0.7605793476104736, "value_row": 0.3320169448852539, "value_any": 0.15137207508087158, "value_bot": 0.023324737325310707, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01190.png", "entropy": 0.1667395383119583} +{"ts": "2026-01-29T21:49:27.523567Z", "loop": 1195, "env_steps": 734208000, "exact_value_avg": 0.4121881127357483, "regret_dist": 0.3915892243385315, "regret_other_env": 0.6513341069221497, "regret_corner": 0.001971901161596179, "regret_row": 0.5513389706611633, "regret_any": 0.6513341069221497, "regret_bot": 0.75958251953125, "value_dist": 0.4121881127357483, "value_other_env": 0.17821896076202393, "value_corner": 0.7631418108940125, "value_row": 0.24535010755062103, "value_any": 0.17821896076202393, "value_bot": 0.03710648790001869, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01195.png", "entropy": 0.1402483582496643} +{"ts": "2026-01-29T21:49:33.370759Z", "loop": 1200, "env_steps": 737280000, "exact_value_avg": 0.4185676872730255, "regret_dist": 0.38520967960357666, "regret_other_env": 0.6417370438575745, "regret_corner": 0.00041855673771351576, "regret_row": 0.531633198261261, "regret_any": 0.6417370438575745, "regret_bot": 0.759997546672821, "value_dist": 0.4185676872730255, "value_other_env": 0.18781600892543793, "value_corner": 0.7646951675415039, "value_row": 0.2650558054447174, "value_any": 0.18781600892543793, "value_bot": 0.03669150173664093, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01200.png", "entropy": 0.1417330652475357} +{"ts": "2026-01-29T21:49:39.212659Z", "loop": 1205, "env_steps": 740352000, "exact_value_avg": 0.4221406579017639, "regret_dist": 0.38163667917251587, "regret_other_env": 0.6358450055122375, "regret_corner": 0.0003241886734031141, "regret_row": 0.49427804350852966, "regret_any": 0.6358450055122375, "regret_bot": 0.7614107728004456, "value_dist": 0.4221406579017639, "value_other_env": 0.19370810687541962, "value_corner": 0.7647895216941833, "value_row": 0.3024109899997711, "value_any": 0.19370810687541962, "value_bot": 0.03527823090553284, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01205.png", "entropy": 0.1462474763393402} +{"ts": "2026-01-29T21:49:45.065826Z", "loop": 1210, "env_steps": 743424000, "exact_value_avg": 0.42077866196632385, "regret_dist": 0.3829987049102783, "regret_other_env": 0.6379602551460266, "regret_corner": 0.0005563234444707632, "regret_row": 0.46800458431243896, "regret_any": 0.6379602551460266, "regret_bot": 0.7632701396942139, "value_dist": 0.42077866196632385, "value_other_env": 0.19159281253814697, "value_corner": 0.764557421207428, "value_row": 0.3286844789981842, "value_any": 0.19159281253814697, "value_bot": 0.03341897204518318, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01210.png", "entropy": 0.14914599061012268} +{"ts": "2026-01-29T21:49:50.916174Z", "loop": 1215, "env_steps": 746496000, "exact_value_avg": 0.42651641368865967, "regret_dist": 0.3772609531879425, "regret_other_env": 0.6285707354545593, "regret_corner": 0.000296220212476328, "regret_row": 0.47198906540870667, "regret_any": 0.6285707354545593, "regret_bot": 0.7609319090843201, "value_dist": 0.42651641368865967, "value_other_env": 0.20098234713077545, "value_corner": 0.7648175358772278, "value_row": 0.3247000277042389, "value_any": 0.20098234713077545, "value_bot": 0.035757169127464294, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01215.png", "entropy": 0.14662739634513855} +{"ts": "2026-01-29T21:49:56.766334Z", "loop": 1220, "env_steps": 749568000, "exact_value_avg": 0.4286162853240967, "regret_dist": 0.3751610815525055, "regret_other_env": 0.6250663995742798, "regret_corner": 0.00030308219720609486, "regret_row": 0.4692293107509613, "regret_any": 0.6250663995742798, "regret_bot": 0.7601718306541443, "value_dist": 0.4286162853240967, "value_other_env": 0.2044866681098938, "value_corner": 0.7648106217384338, "value_row": 0.32745975255966187, "value_any": 0.2044866681098938, "value_bot": 0.036517199128866196, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01220.png", "entropy": 0.14775089919567108} +{"ts": "2026-01-29T21:50:02.614203Z", "loop": 1225, "env_steps": 752640000, "exact_value_avg": 0.4221496880054474, "regret_dist": 0.3816276788711548, "regret_other_env": 0.6335886716842651, "regret_corner": 0.0036861500702798367, "regret_row": 0.5120340585708618, "regret_any": 0.6335886716842651, "regret_bot": 0.7590892910957336, "value_dist": 0.4221496880054474, "value_other_env": 0.19596442580223083, "value_corner": 0.7614275813102722, "value_row": 0.2846549153327942, "value_any": 0.19596442580223083, "value_bot": 0.037599749863147736, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01225.png", "entropy": 0.13823631405830383} +{"ts": "2026-01-29T21:50:08.464071Z", "loop": 1230, "env_steps": 755712000, "exact_value_avg": 0.4276054799556732, "regret_dist": 0.37617188692092896, "regret_other_env": 0.626657247543335, "regret_corner": 0.00044383161002770066, "regret_row": 0.45204660296440125, "regret_any": 0.626657247543335, "regret_bot": 0.7616339325904846, "value_dist": 0.4276054799556732, "value_other_env": 0.20289583504199982, "value_corner": 0.7646698951721191, "value_row": 0.34464243054389954, "value_any": 0.20289583504199982, "value_bot": 0.03505513444542885, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01230.png", "entropy": 0.1439301073551178} +{"ts": "2026-01-29T21:50:14.317377Z", "loop": 1235, "env_steps": 758784000, "exact_value_avg": 0.4315257966518402, "regret_dist": 0.3722515404224396, "regret_other_env": 0.6203078627586365, "regret_corner": 0.00016700626292731613, "regret_row": 0.4610995948314667, "regret_any": 0.6203078627586365, "regret_bot": 0.7602264285087585, "value_dist": 0.4315257966518402, "value_other_env": 0.2092452347278595, "value_corner": 0.7649466395378113, "value_row": 0.3355894684791565, "value_any": 0.2092452347278595, "value_bot": 0.036462604999542236, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01235.png", "entropy": 0.13631920516490936} +{"ts": "2026-01-29T21:50:20.166100Z", "loop": 1240, "env_steps": 761856000, "exact_value_avg": 0.42892277240753174, "regret_dist": 0.3748546540737152, "regret_other_env": 0.6245506405830383, "regret_corner": 0.0003105854266323149, "regret_row": 0.49323931336402893, "regret_any": 0.6245506405830383, "regret_bot": 0.7590226531028748, "value_dist": 0.42892277240753174, "value_other_env": 0.20500245690345764, "value_corner": 0.7648031711578369, "value_row": 0.30344972014427185, "value_any": 0.20500245690345764, "value_bot": 0.03766637668013573, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01240.png", "entropy": 0.12299049645662308} +{"ts": "2026-01-29T21:50:26.013578Z", "loop": 1245, "env_steps": 764928000, "exact_value_avg": 0.4330071210861206, "regret_dist": 0.37077030539512634, "regret_other_env": 0.6178839206695557, "regret_corner": 9.980351023841649e-05, "regret_row": 0.4701249897480011, "regret_any": 0.6178839206695557, "regret_bot": 0.7594554424285889, "value_dist": 0.4330071210861206, "value_other_env": 0.21166925132274628, "value_corner": 0.7650139331817627, "value_row": 0.32656407356262207, "value_any": 0.21166925132274628, "value_bot": 0.03723359480500221, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01245.png", "entropy": 0.12780430912971497} +{"ts": "2026-01-29T21:50:31.855264Z", "loop": 1250, "env_steps": 768000000, "exact_value_avg": 0.43283480405807495, "regret_dist": 0.3709425926208496, "regret_other_env": 0.6181679964065552, "regret_corner": 0.0001044521777657792, "regret_row": 0.4554857909679413, "regret_any": 0.6181679964065552, "regret_bot": 0.7607173919677734, "value_dist": 0.43283480405807495, "value_other_env": 0.21138516068458557, "value_corner": 0.7650092840194702, "value_row": 0.3412032723426819, "value_any": 0.21138516068458557, "value_bot": 0.03597169369459152, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01250.png", "entropy": 0.13147896528244019} +{"ts": "2026-01-29T21:50:37.702581Z", "loop": 1255, "env_steps": 771072000, "exact_value_avg": 0.43401578068733215, "regret_dist": 0.36976158618927, "regret_other_env": 0.6162045001983643, "regret_corner": 9.718487854115665e-05, "regret_row": 0.4671672284603119, "regret_any": 0.6162045001983643, "regret_bot": 0.7595524191856384, "value_dist": 0.43401578068733215, "value_other_env": 0.21334856748580933, "value_corner": 0.7650165557861328, "value_row": 0.3295218348503113, "value_any": 0.21334856748580933, "value_bot": 0.037136659026145935, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01255.png", "entropy": 0.13123835623264313} +{"ts": "2026-01-29T21:50:43.549129Z", "loop": 1260, "env_steps": 774144000, "exact_value_avg": 0.43427586555480957, "regret_dist": 0.3695015013217926, "regret_other_env": 0.6157525777816772, "regret_corner": 0.00012485336628742516, "regret_row": 0.46574318408966064, "regret_any": 0.6157525777816772, "regret_bot": 0.7595979571342468, "value_dist": 0.43427586555480957, "value_other_env": 0.21380050480365753, "value_corner": 0.764988899230957, "value_row": 0.33094584941864014, "value_any": 0.21380050480365753, "value_bot": 0.03709104284644127, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01260.png", "entropy": 0.13723960518836975} +{"ts": "2026-01-29T21:50:49.395097Z", "loop": 1265, "env_steps": 777216000, "exact_value_avg": 0.43421679735183716, "regret_dist": 0.3695605993270874, "regret_other_env": 0.6158595681190491, "regret_corner": 0.00011209498188691214, "regret_row": 0.44573673605918884, "regret_any": 0.6158595681190491, "regret_bot": 0.761139452457428, "value_dist": 0.43421679735183716, "value_other_env": 0.2136935591697693, "value_corner": 0.7650015950202942, "value_row": 0.3509523272514343, "value_any": 0.2136935591697693, "value_bot": 0.035549554973840714, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01265.png", "entropy": 0.14418689906597137} +{"ts": "2026-01-29T21:50:55.239908Z", "loop": 1270, "env_steps": 780288000, "exact_value_avg": 0.427738219499588, "regret_dist": 0.37603914737701416, "regret_other_env": 0.6263852119445801, "regret_corner": 0.0005199581501074135, "regret_row": 0.42952078580856323, "regret_any": 0.6263852119445801, "regret_bot": 0.7659123539924622, "value_dist": 0.427738219499588, "value_other_env": 0.2031678557395935, "value_corner": 0.764593780040741, "value_row": 0.36716824769973755, "value_any": 0.2031678557395935, "value_bot": 0.030776681378483772, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01270.png", "entropy": 0.1443345993757248} +{"ts": "2026-01-29T21:51:01.085125Z", "loop": 1275, "env_steps": 783360000, "exact_value_avg": 0.4357307553291321, "regret_dist": 0.3680466413497925, "regret_other_env": 0.6133568286895752, "regret_corner": 8.135140524245799e-05, "regret_row": 0.4520045220851898, "regret_any": 0.6133568286895752, "regret_bot": 0.7597522735595703, "value_dist": 0.4357307553291321, "value_other_env": 0.21619628369808197, "value_corner": 0.7650323510169983, "value_row": 0.34468451142311096, "value_any": 0.21619628369808197, "value_bot": 0.03693676367402077, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01275.png", "entropy": 0.1344870924949646} +{"ts": "2026-01-29T21:51:06.930097Z", "loop": 1280, "env_steps": 786432000, "exact_value_avg": 0.4265361428260803, "regret_dist": 0.37724125385284424, "regret_other_env": 0.6269473433494568, "regret_corner": 0.0026820541825145483, "regret_row": 0.5133922100067139, "regret_any": 0.6269473433494568, "regret_bot": 0.7588053345680237, "value_dist": 0.4265361428260803, "value_other_env": 0.20260575413703918, "value_corner": 0.7624316811561584, "value_row": 0.2832968533039093, "value_any": 0.20260575413703918, "value_bot": 0.037883758544921875, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01280.png", "entropy": 0.11697281897068024} +{"ts": "2026-01-29T21:51:12.780280Z", "loop": 1285, "env_steps": 789504000, "exact_value_avg": 0.4364768862724304, "regret_dist": 0.36730048060417175, "regret_other_env": 0.6121286153793335, "regret_corner": 5.822927050758153e-05, "regret_row": 0.4448246657848358, "regret_any": 0.6121286153793335, "regret_bot": 0.7598959803581238, "value_dist": 0.4364768862724304, "value_other_env": 0.21742446720600128, "value_corner": 0.7650554776191711, "value_row": 0.35186439752578735, "value_any": 0.21742446720600128, "value_bot": 0.03679307550191879, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01285.png", "entropy": 0.12797118723392487} +{"ts": "2026-01-29T21:51:18.651390Z", "loop": 1290, "env_steps": 792576000, "exact_value_avg": 0.421828955411911, "regret_dist": 0.38194841146469116, "regret_other_env": 0.635917067527771, "regret_corner": 0.0009954065317288041, "regret_row": 0.4220641851425171, "regret_any": 0.635917067527771, "regret_bot": 0.7696853876113892, "value_dist": 0.421828955411911, "value_other_env": 0.1936360001564026, "value_corner": 0.7641183733940125, "value_row": 0.3746248185634613, "value_any": 0.1936360001564026, "value_bot": 0.02700362540781498, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01290.png", "entropy": 0.13281017541885376} +{"ts": "2026-01-29T21:51:24.509607Z", "loop": 1295, "env_steps": 795648000, "exact_value_avg": 0.42995163798332214, "regret_dist": 0.37382566928863525, "regret_other_env": 0.6223961114883423, "regret_corner": 0.0009700015652924776, "regret_row": 0.5010429620742798, "regret_any": 0.6223961114883423, "regret_bot": 0.7587884664535522, "value_dist": 0.42995163798332214, "value_other_env": 0.2071569412946701, "value_corner": 0.764143705368042, "value_row": 0.295646071434021, "value_any": 0.2071569412946701, "value_bot": 0.03790055215358734, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01295.png", "entropy": 0.10851765424013138} +{"ts": "2026-01-29T21:51:30.360157Z", "loop": 1300, "env_steps": 798720000, "exact_value_avg": 0.4291389584541321, "regret_dist": 0.3746383786201477, "regret_other_env": 0.6240674257278442, "regret_corner": 0.0004948084824718535, "regret_row": 0.5124473571777344, "regret_any": 0.6240674257278442, "regret_bot": 0.7588193416595459, "value_dist": 0.4291389584541321, "value_other_env": 0.20548564195632935, "value_corner": 0.7646189332008362, "value_row": 0.2842416763305664, "value_any": 0.20548564195632935, "value_bot": 0.0378696471452713, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01300.png", "entropy": 0.10482259094715118} +{"ts": "2026-01-29T21:51:36.221334Z", "loop": 1305, "env_steps": 801792000, "exact_value_avg": 0.4364442229270935, "regret_dist": 0.36733317375183105, "regret_other_env": 0.6121949553489685, "regret_corner": 4.043678563903086e-05, "regret_row": 0.4609852135181427, "regret_any": 0.6121949553489685, "regret_bot": 0.7595961689949036, "value_dist": 0.4364442229270935, "value_other_env": 0.21735815703868866, "value_corner": 0.765073299407959, "value_row": 0.33570384979248047, "value_any": 0.21735815703868866, "value_bot": 0.037092842161655426, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01305.png", "entropy": 0.11598570644855499} +{"ts": "2026-01-29T21:51:42.073673Z", "loop": 1310, "env_steps": 804864000, "exact_value_avg": 0.4314045310020447, "regret_dist": 0.3723727762699127, "regret_other_env": 0.6205105781555176, "regret_corner": 0.00016604166012257338, "regret_row": 0.42712387442588806, "regret_any": 0.6205105781555176, "regret_bot": 0.768519401550293, "value_dist": 0.4314045310020447, "value_other_env": 0.20904244482517242, "value_corner": 0.7649476528167725, "value_row": 0.3695651888847351, "value_any": 0.20904244482517242, "value_bot": 0.028169715777039528, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01310.png", "entropy": 0.13433164358139038} +{"ts": "2026-01-29T21:51:47.934665Z", "loop": 1315, "env_steps": 807936000, "exact_value_avg": 0.4365975856781006, "regret_dist": 0.3671797513961792, "regret_other_env": 0.6119158864021301, "regret_corner": 7.556081254733726e-05, "regret_row": 0.4306558072566986, "regret_any": 0.6119158864021301, "regret_bot": 0.7631294131278992, "value_dist": 0.4365975856781006, "value_other_env": 0.21763719618320465, "value_corner": 0.7650381326675415, "value_row": 0.36603325605392456, "value_any": 0.21763719618320465, "value_bot": 0.03355960175395012, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01315.png", "entropy": 0.1288578063249588} +{"ts": "2026-01-29T21:51:53.786264Z", "loop": 1320, "env_steps": 811008000, "exact_value_avg": 0.4381750822067261, "regret_dist": 0.3656022548675537, "regret_other_env": 0.6093089580535889, "regret_corner": 4.219114998704754e-05, "regret_row": 0.4373178482055664, "regret_any": 0.6093089580535889, "regret_bot": 0.760255753993988, "value_dist": 0.4381750822067261, "value_other_env": 0.22024410963058472, "value_corner": 0.7650715112686157, "value_row": 0.3593711853027344, "value_any": 0.22024410963058472, "value_bot": 0.03643331676721573, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01320.png", "entropy": 0.12111897766590118} +{"ts": "2026-01-29T21:51:59.639011Z", "loop": 1325, "env_steps": 814080000, "exact_value_avg": 0.43629589676856995, "regret_dist": 0.3674814999103546, "regret_other_env": 0.612430214881897, "regret_corner": 5.8382753195473924e-05, "regret_row": 0.4656754732131958, "regret_any": 0.612430214881897, "regret_bot": 0.7590181827545166, "value_dist": 0.43629589676856995, "value_other_env": 0.21712292730808258, "value_corner": 0.7650553584098816, "value_row": 0.331013560295105, "value_any": 0.21712292730808258, "value_bot": 0.03767084702849388, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01325.png", "entropy": 0.10768785327672958} +{"ts": "2026-01-29T21:52:05.494991Z", "loop": 1330, "env_steps": 817152000, "exact_value_avg": 0.43704473972320557, "regret_dist": 0.3667326867580414, "regret_other_env": 0.6111905574798584, "regret_corner": 4.5810145820723847e-05, "regret_row": 0.4586055874824524, "regret_any": 0.6111905574798584, "regret_bot": 0.7590315937995911, "value_dist": 0.43704473972320557, "value_other_env": 0.21836252510547638, "value_corner": 0.765067994594574, "value_row": 0.3380834460258484, "value_any": 0.21836252510547638, "value_bot": 0.037657417356967926, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01330.png", "entropy": 0.10722249746322632} +{"ts": "2026-01-29T21:52:11.353666Z", "loop": 1335, "env_steps": 820224000, "exact_value_avg": 0.4384186267852783, "regret_dist": 0.36535876989364624, "regret_other_env": 0.6089069247245789, "regret_corner": 3.6533179809339345e-05, "regret_row": 0.4448152482509613, "regret_any": 0.6089069247245789, "regret_bot": 0.7592253088951111, "value_dist": 0.4384186267852783, "value_other_env": 0.2206462323665619, "value_corner": 0.7650772333145142, "value_row": 0.3518737554550171, "value_any": 0.2206462323665619, "value_bot": 0.03746374696493149, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01335.png", "entropy": 0.11293066293001175} +{"ts": "2026-01-29T21:52:17.207313Z", "loop": 1340, "env_steps": 823296000, "exact_value_avg": 0.43910032510757446, "regret_dist": 0.3646770715713501, "regret_other_env": 0.6077684760093689, "regret_corner": 3.990034383605234e-05, "regret_row": 0.4388771653175354, "regret_any": 0.6077684760093689, "regret_bot": 0.7594007849693298, "value_dist": 0.43910032510757446, "value_other_env": 0.22178462147712708, "value_corner": 0.765073835849762, "value_row": 0.3578118681907654, "value_any": 0.22178462147712708, "value_bot": 0.037288226187229156, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01340.png", "entropy": 0.11915542930364609} +{"ts": "2026-01-29T21:52:23.070732Z", "loop": 1345, "env_steps": 826368000, "exact_value_avg": 0.4363216459751129, "regret_dist": 0.36745575070381165, "regret_other_env": 0.6123008131980896, "regret_corner": 0.00018811972404364496, "regret_row": 0.4129216969013214, "regret_any": 0.6123008131980896, "regret_bot": 0.763419508934021, "value_dist": 0.4363216459751129, "value_other_env": 0.21725226938724518, "value_corner": 0.7649256587028503, "value_row": 0.38376736640930176, "value_any": 0.21725226938724518, "value_bot": 0.03326947242021561, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01345.png", "entropy": 0.13310328125953674} +{"ts": "2026-01-29T21:52:28.937730Z", "loop": 1350, "env_steps": 829440000, "exact_value_avg": 0.4391435980796814, "regret_dist": 0.36463379859924316, "regret_other_env": 0.6076805591583252, "regret_corner": 6.360858969856054e-05, "regret_row": 0.42263469099998474, "regret_any": 0.6076805591583252, "regret_bot": 0.760773777961731, "value_dist": 0.4391435980796814, "value_other_env": 0.22187258303165436, "value_corner": 0.7650501132011414, "value_row": 0.3740543723106384, "value_any": 0.22187258303165436, "value_bot": 0.035915207117795944, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01350.png", "entropy": 0.1283387690782547} +{"ts": "2026-01-29T21:52:34.788293Z", "loop": 1355, "env_steps": 832512000, "exact_value_avg": 0.43891996145248413, "regret_dist": 0.36485737562179565, "regret_other_env": 0.6080442667007446, "regret_corner": 7.707426993874833e-05, "regret_row": 0.4448857605457306, "regret_any": 0.6080442667007446, "regret_bot": 0.759027898311615, "value_dist": 0.43891996145248413, "value_other_env": 0.22150875627994537, "value_corner": 0.7650367021560669, "value_row": 0.3518033027648926, "value_any": 0.22150875627994537, "value_bot": 0.037661146372556686, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01355.png", "entropy": 0.1157425120472908} +{"ts": "2026-01-29T21:52:40.652430Z", "loop": 1360, "env_steps": 835584000, "exact_value_avg": 0.43050822615623474, "regret_dist": 0.37326908111572266, "regret_other_env": 0.6208339333534241, "regret_corner": 0.0019218241795897484, "regret_row": 0.5070534944534302, "regret_any": 0.6208339333534241, "regret_bot": 0.7587504982948303, "value_dist": 0.43050822615623474, "value_other_env": 0.20871911942958832, "value_corner": 0.7631918787956238, "value_row": 0.2896355390548706, "value_any": 0.20871911942958832, "value_bot": 0.037938542664051056, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01360.png", "entropy": 0.10406937450170517} +{"ts": "2026-01-29T21:52:46.506251Z", "loop": 1365, "env_steps": 838656000, "exact_value_avg": 0.4393414556980133, "regret_dist": 0.36443594098091125, "regret_other_env": 0.6073554754257202, "regret_corner": 5.6603057601023465e-05, "regret_row": 0.4447265565395355, "regret_any": 0.6073554754257202, "regret_bot": 0.7590758800506592, "value_dist": 0.4393414556980133, "value_other_env": 0.22219766676425934, "value_corner": 0.7650571465492249, "value_row": 0.35196244716644287, "value_any": 0.22219766676425934, "value_bot": 0.03761318325996399, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01365.png", "entropy": 0.11257684230804443} +{"ts": "2026-01-29T21:52:52.370676Z", "loop": 1370, "env_steps": 841728000, "exact_value_avg": 0.44058629870414734, "regret_dist": 0.36319106817245483, "regret_other_env": 0.6052937507629395, "regret_corner": 3.702193862409331e-05, "regret_row": 0.4257383346557617, "regret_any": 0.6052937507629395, "regret_bot": 0.7603662610054016, "value_dist": 0.44058629870414734, "value_other_env": 0.22425933182239532, "value_corner": 0.7650766968727112, "value_row": 0.37095075845718384, "value_any": 0.22425933182239532, "value_bot": 0.036322712898254395, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01370.png", "entropy": 0.1239037811756134} +{"ts": "2026-01-29T21:52:58.217320Z", "loop": 1375, "env_steps": 844800000, "exact_value_avg": 0.4398289918899536, "regret_dist": 0.36394837498664856, "regret_other_env": 0.6065459251403809, "regret_corner": 5.2011513616889715e-05, "regret_row": 0.4143940210342407, "regret_any": 0.6065459251403809, "regret_bot": 0.7622344493865967, "value_dist": 0.4398289918899536, "value_other_env": 0.22300712764263153, "value_corner": 0.7650617361068726, "value_row": 0.38229504227638245, "value_any": 0.22300712764263153, "value_bot": 0.034454621374607086, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01375.png", "entropy": 0.12765945494174957} +{"ts": "2026-01-29T21:53:04.059518Z", "loop": 1380, "env_steps": 847872000, "exact_value_avg": 0.4406176209449768, "regret_dist": 0.36315974593162537, "regret_other_env": 0.6052486896514893, "regret_corner": 2.632240648381412e-05, "regret_row": 0.434944748878479, "regret_any": 0.6052486896514893, "regret_bot": 0.7594678401947021, "value_dist": 0.4406176209449768, "value_other_env": 0.22430437803268433, "value_corner": 0.7650874257087708, "value_row": 0.3617442548274994, "value_any": 0.22430437803268433, "value_bot": 0.03722120076417923, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01380.png", "entropy": 0.11090512573719025} +{"ts": "2026-01-29T21:53:09.910272Z", "loop": 1385, "env_steps": 850944000, "exact_value_avg": 0.43938785791397095, "regret_dist": 0.36438947916030884, "regret_other_env": 0.6072985529899597, "regret_corner": 2.5819243091973476e-05, "regret_row": 0.44629916548728943, "regret_any": 0.6072985529899597, "regret_bot": 0.7590370774269104, "value_dist": 0.43938785791397095, "value_other_env": 0.22225446999073029, "value_corner": 0.765087902545929, "value_row": 0.35038986802101135, "value_any": 0.22225446999073029, "value_bot": 0.037651970982551575, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01385.png", "entropy": 0.10028429329395294} +{"ts": "2026-01-29T21:53:15.772266Z", "loop": 1390, "env_steps": 854016000, "exact_value_avg": 0.4409973621368408, "regret_dist": 0.3627799451351166, "regret_other_env": 0.604619026184082, "regret_corner": 2.13235634873854e-05, "regret_row": 0.42735570669174194, "regret_any": 0.604619026184082, "regret_bot": 0.7604551315307617, "value_dist": 0.4409973621368408, "value_other_env": 0.22493402659893036, "value_corner": 0.7650923728942871, "value_row": 0.3693333566188812, "value_any": 0.22493402659893036, "value_bot": 0.036233894526958466, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01390.png", "entropy": 0.10958448797464371} +{"ts": "2026-01-29T21:53:21.636456Z", "loop": 1395, "env_steps": 857088000, "exact_value_avg": 0.4410594403743744, "regret_dist": 0.36271795630455017, "regret_other_env": 0.6045173406600952, "regret_corner": 1.882910873973742e-05, "regret_row": 0.4325145184993744, "regret_any": 0.6045173406600952, "regret_bot": 0.7596642971038818, "value_dist": 0.4410594403743744, "value_other_env": 0.22503574192523956, "value_corner": 0.7650949358940125, "value_row": 0.3641745150089264, "value_any": 0.22503574192523956, "value_bot": 0.037024758756160736, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01395.png", "entropy": 0.10574463754892349} +{"ts": "2026-01-29T21:53:27.484363Z", "loop": 1400, "env_steps": 860160000, "exact_value_avg": 0.4395793676376343, "regret_dist": 0.3641980290412903, "regret_other_env": 0.6069804430007935, "regret_corner": 2.435495662211906e-05, "regret_row": 0.4479992389678955, "regret_any": 0.6069804430007935, "regret_bot": 0.7589613199234009, "value_dist": 0.4395793676376343, "value_other_env": 0.2225726991891861, "value_corner": 0.7650893926620483, "value_row": 0.34868982434272766, "value_any": 0.2225726991891861, "value_bot": 0.0377277247607708, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01400.png", "entropy": 0.09760525822639465} +{"ts": "2026-01-29T21:53:33.330022Z", "loop": 1405, "env_steps": 863232000, "exact_value_avg": 0.4374222755432129, "regret_dist": 0.36635512113571167, "regret_other_env": 0.6105456948280334, "regret_corner": 6.921192107256502e-05, "regret_row": 0.4676949083805084, "regret_any": 0.6105456948280334, "regret_bot": 0.7587978839874268, "value_dist": 0.4374222755432129, "value_other_env": 0.21900740265846252, "value_corner": 0.7650445103645325, "value_row": 0.32899412512779236, "value_any": 0.21900740265846252, "value_bot": 0.037891194224357605, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01405.png", "entropy": 0.09482049196958542} +{"ts": "2026-01-29T21:53:39.179966Z", "loop": 1410, "env_steps": 866304000, "exact_value_avg": 0.43815651535987854, "regret_dist": 0.365620881319046, "regret_other_env": 0.6092990040779114, "regret_corner": 0.00010363361070631072, "regret_row": 0.46387746930122375, "regret_any": 0.6092990040779114, "regret_bot": 0.7588270306587219, "value_dist": 0.43815651535987854, "value_other_env": 0.2202540934085846, "value_corner": 0.7650101184844971, "value_row": 0.33281150460243225, "value_any": 0.2202540934085846, "value_bot": 0.03786208853125572, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01410.png", "entropy": 0.09933826327323914} +{"ts": "2026-01-29T21:53:45.032659Z", "loop": 1415, "env_steps": 869376000, "exact_value_avg": 0.44173818826675415, "regret_dist": 0.3620392084121704, "regret_other_env": 0.6033744215965271, "regret_corner": 3.6364795960253105e-05, "regret_row": 0.43269234895706177, "regret_any": 0.6033744215965271, "regret_bot": 0.7592225074768066, "value_dist": 0.44173818826675415, "value_other_env": 0.22617867588996887, "value_corner": 0.7650773525238037, "value_row": 0.3639967143535614, "value_any": 0.22617867588996887, "value_bot": 0.03746649995446205, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01415.png", "entropy": 0.11040158569812775} +{"ts": "2026-01-29T21:53:50.880531Z", "loop": 1420, "env_steps": 872448000, "exact_value_avg": 0.44264131784439087, "regret_dist": 0.3611360490322113, "regret_other_env": 0.601871907711029, "regret_corner": 3.2267471397062764e-05, "regret_row": 0.4200330674648285, "regret_any": 0.601871907711029, "regret_bot": 0.759649932384491, "value_dist": 0.44264131784439087, "value_other_env": 0.22768118977546692, "value_corner": 0.7650814652442932, "value_row": 0.3766559958457947, "value_any": 0.22768118977546692, "value_bot": 0.0370391421020031, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01420.png", "entropy": 0.11692455410957336} +{"ts": "2026-01-29T21:53:56.731413Z", "loop": 1425, "env_steps": 875520000, "exact_value_avg": 0.44208186864852905, "regret_dist": 0.3616954982280731, "regret_other_env": 0.6027929782867432, "regret_corner": 4.927913687424734e-05, "regret_row": 0.4059259593486786, "regret_any": 0.6027929782867432, "regret_bot": 0.7613163590431213, "value_dist": 0.44208186864852905, "value_other_env": 0.226760134100914, "value_corner": 0.7650644779205322, "value_row": 0.3907630443572998, "value_any": 0.226760134100914, "value_bot": 0.03537267819046974, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01425.png", "entropy": 0.13030874729156494} +{"ts": "2026-01-29T21:54:02.577978Z", "loop": 1430, "env_steps": 878592000, "exact_value_avg": 0.44299930334091187, "regret_dist": 0.3607780933380127, "regret_other_env": 0.6012645959854126, "regret_corner": 4.829913450521417e-05, "regret_row": 0.41092661023139954, "regret_any": 0.6012645959854126, "regret_bot": 0.7600674629211426, "value_dist": 0.44299930334091187, "value_other_env": 0.22828854620456696, "value_corner": 0.7650654315948486, "value_row": 0.38576245307922363, "value_any": 0.22828854620456696, "value_bot": 0.03662155568599701, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01430.png", "entropy": 0.12752948701381683} +{"ts": "2026-01-29T21:54:08.421015Z", "loop": 1435, "env_steps": 881664000, "exact_value_avg": 0.443164587020874, "regret_dist": 0.36061280965805054, "regret_other_env": 0.600989043712616, "regret_corner": 4.8420828534290195e-05, "regret_row": 0.41235795617103577, "regret_any": 0.600989043712616, "regret_bot": 0.7598164677619934, "value_dist": 0.443164587020874, "value_other_env": 0.2285640686750412, "value_corner": 0.7650653123855591, "value_row": 0.3843311071395874, "value_any": 0.2285640686750412, "value_bot": 0.03687255084514618, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01435.png", "entropy": 0.12379254400730133} +{"ts": "2026-01-29T21:54:14.266549Z", "loop": 1440, "env_steps": 884736000, "exact_value_avg": 0.443215012550354, "regret_dist": 0.36056238412857056, "regret_other_env": 0.6009121537208557, "regret_corner": 3.769547038245946e-05, "regret_row": 0.40852978825569153, "regret_any": 0.6009121537208557, "regret_bot": 0.7601015567779541, "value_dist": 0.443215012550354, "value_other_env": 0.22864098846912384, "value_corner": 0.7650759816169739, "value_row": 0.38815924525260925, "value_any": 0.22864098846912384, "value_bot": 0.03658744692802429, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01440.png", "entropy": 0.12185998260974884} +{"ts": "2026-01-29T21:54:20.115205Z", "loop": 1445, "env_steps": 887808000, "exact_value_avg": 0.44347092509269714, "regret_dist": 0.3603065013885498, "regret_other_env": 0.6004860401153564, "regret_corner": 3.7158530176384374e-05, "regret_row": 0.4106721580028534, "regret_any": 0.6004860401153564, "regret_bot": 0.7597169280052185, "value_dist": 0.44347092509269714, "value_other_env": 0.2290671020746231, "value_corner": 0.7650766372680664, "value_row": 0.3860168755054474, "value_any": 0.2290671020746231, "value_bot": 0.03697211295366287, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01445.png", "entropy": 0.11788564175367355} +{"ts": "2026-01-29T21:54:25.958762Z", "loop": 1450, "env_steps": 890880000, "exact_value_avg": 0.44177621603012085, "regret_dist": 0.3620011508464813, "regret_other_env": 0.603288471698761, "regret_corner": 7.011394336586818e-05, "regret_row": 0.4372701942920685, "regret_any": 0.603288471698761, "regret_bot": 0.7589213848114014, "value_dist": 0.44177621603012085, "value_other_env": 0.2262645959854126, "value_corner": 0.7650436162948608, "value_row": 0.3594188690185547, "value_any": 0.2262645959854126, "value_bot": 0.03776765614748001, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01450.png", "entropy": 0.10340059548616409} +{"ts": "2026-01-29T21:54:31.807262Z", "loop": 1455, "env_steps": 893952000, "exact_value_avg": 0.44375354051589966, "regret_dist": 0.3600237965583801, "regret_other_env": 0.6000255942344666, "regret_corner": 2.108365333697293e-05, "regret_row": 0.41111207008361816, "regret_any": 0.6000255942344666, "regret_bot": 0.7596864700317383, "value_dist": 0.44375354051589966, "value_other_env": 0.22952748835086823, "value_corner": 0.7650926113128662, "value_row": 0.385576993227005, "value_any": 0.22952748835086823, "value_bot": 0.03700251132249832, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01455.png", "entropy": 0.10966868698596954} +{"ts": "2026-01-29T21:54:37.652458Z", "loop": 1460, "env_steps": 897024000, "exact_value_avg": 0.44348254799842834, "regret_dist": 0.36029481887817383, "regret_other_env": 0.6004740595817566, "regret_corner": 2.5890769393299706e-05, "regret_row": 0.4058254659175873, "regret_any": 0.6004740595817566, "regret_bot": 0.7608198523521423, "value_dist": 0.44348254799842834, "value_other_env": 0.22907902300357819, "value_corner": 0.7650877833366394, "value_row": 0.3908635675907135, "value_any": 0.22907902300357819, "value_bot": 0.03586916998028755, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01460.png", "entropy": 0.11237568408250809} +{"ts": "2026-01-29T21:54:43.492657Z", "loop": 1465, "env_steps": 900096000, "exact_value_avg": 0.44396233558654785, "regret_dist": 0.3598150312900543, "regret_other_env": 0.5996780395507812, "regret_corner": 2.0467243302846327e-05, "regret_row": 0.4075663685798645, "regret_any": 0.5996780395507812, "regret_bot": 0.7599160671234131, "value_dist": 0.44396233558654785, "value_other_env": 0.22987505793571472, "value_corner": 0.7650932669639587, "value_row": 0.38912269473075867, "value_any": 0.22987505793571472, "value_bot": 0.036772988736629486, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01465.png", "entropy": 0.10843489319086075} +{"ts": "2026-01-29T21:54:49.339335Z", "loop": 1470, "env_steps": 903168000, "exact_value_avg": 0.44147491455078125, "regret_dist": 0.36230242252349854, "regret_other_env": 0.6037943363189697, "regret_corner": 6.45071268081665e-05, "regret_row": 0.4024023711681366, "regret_any": 0.6037943363189697, "regret_bot": 0.7628628611564636, "value_dist": 0.44147491455078125, "value_other_env": 0.22575871646404266, "value_corner": 0.7650492191314697, "value_row": 0.3942866921424866, "value_any": 0.22575871646404266, "value_bot": 0.033826183527708054, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01470.png", "entropy": 0.12052525579929352} +{"ts": "2026-01-29T21:54:55.183879Z", "loop": 1475, "env_steps": 906240000, "exact_value_avg": 0.4442884922027588, "regret_dist": 0.3594888746738434, "regret_other_env": 0.5991267561912537, "regret_corner": 3.202011430403218e-05, "regret_row": 0.40729978680610657, "regret_any": 0.5991267561912537, "regret_bot": 0.7597439289093018, "value_dist": 0.4442884922027588, "value_other_env": 0.23042632639408112, "value_corner": 0.7650817036628723, "value_row": 0.3893892467021942, "value_any": 0.23042632639408112, "value_bot": 0.03694510832428932, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01475.png", "entropy": 0.11222842335700989} +{"ts": "2026-01-29T21:55:01.028553Z", "loop": 1480, "env_steps": 909312000, "exact_value_avg": 0.4407433867454529, "regret_dist": 0.3630339503288269, "regret_other_env": 0.6047475337982178, "regret_corner": 0.00046355926315300167, "regret_row": 0.4474194049835205, "regret_any": 0.6047475337982178, "regret_bot": 0.7588689923286438, "value_dist": 0.4407433867454529, "value_other_env": 0.2248055636882782, "value_corner": 0.7646501064300537, "value_row": 0.3492695987224579, "value_any": 0.2248055636882782, "value_bot": 0.037820056080818176, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01480.png", "entropy": 0.10496312379837036} +{"ts": "2026-01-29T21:55:06.876325Z", "loop": 1485, "env_steps": 912384000, "exact_value_avg": 0.44179296493530273, "regret_dist": 0.3619844615459442, "regret_other_env": 0.6030758023262024, "regret_corner": 0.00034741064882837236, "regret_row": 0.4381118714809418, "regret_any": 0.6030758023262024, "regret_bot": 0.7590116262435913, "value_dist": 0.44179296493530273, "value_other_env": 0.22647733986377716, "value_corner": 0.7647663354873657, "value_row": 0.3585771918296814, "value_any": 0.22647733986377716, "value_bot": 0.03767740726470947, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01485.png", "entropy": 0.11015166342258453} +{"ts": "2026-01-29T21:55:12.725659Z", "loop": 1490, "env_steps": 915456000, "exact_value_avg": 0.4428041875362396, "regret_dist": 0.36097320914268494, "regret_other_env": 0.6015653610229492, "regret_corner": 8.49500356707722e-05, "regret_row": 0.4027291238307953, "regret_any": 0.6015653610229492, "regret_bot": 0.7621963024139404, "value_dist": 0.4428041875362396, "value_other_env": 0.22798776626586914, "value_corner": 0.7650287747383118, "value_row": 0.3939599096775055, "value_any": 0.22798776626586914, "value_bot": 0.03449275717139244, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01490.png", "entropy": 0.13077358901500702} +{"ts": "2026-01-29T21:55:18.568588Z", "loop": 1495, "env_steps": 918528000, "exact_value_avg": 0.43710529804229736, "regret_dist": 0.3666720986366272, "regret_other_env": 0.6104442477226257, "regret_corner": 0.0010138422949239612, "regret_row": 0.39250195026397705, "regret_any": 0.6104442477226257, "regret_bot": 0.7664669156074524, "value_dist": 0.43710529804229736, "value_other_env": 0.21910886466503143, "value_corner": 0.7640998959541321, "value_row": 0.40418708324432373, "value_any": 0.21910886466503143, "value_bot": 0.030222130939364433, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01495.png", "entropy": 0.13979290425777435} +{"ts": "2026-01-29T21:55:24.411774Z", "loop": 1500, "env_steps": 921600000, "exact_value_avg": 0.44339990615844727, "regret_dist": 0.3603774905204773, "regret_other_env": 0.600594699382782, "regret_corner": 5.1607195928227156e-05, "regret_row": 0.4023231267929077, "regret_any": 0.600594699382782, "regret_bot": 0.7621485590934753, "value_dist": 0.44339990615844727, "value_other_env": 0.228958398103714, "value_corner": 0.7650620937347412, "value_row": 0.39436593651771545, "value_any": 0.228958398103714, "value_bot": 0.03454047441482544, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01500.png", "entropy": 0.11985305696725845} +{"ts": "2026-01-29T21:55:30.254787Z", "loop": 1505, "env_steps": 924672000, "exact_value_avg": 0.443756103515625, "regret_dist": 0.3600212633609772, "regret_other_env": 0.6000142693519592, "regret_corner": 3.1775238312548026e-05, "regret_row": 0.4225963056087494, "regret_any": 0.6000142693519592, "regret_bot": 0.7589177489280701, "value_dist": 0.443756103515625, "value_other_env": 0.22953885793685913, "value_corner": 0.7650819420814514, "value_row": 0.3740927278995514, "value_any": 0.22953885793685913, "value_bot": 0.03777128830552101, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01505.png", "entropy": 0.09198374301195145} +{"ts": "2026-01-29T21:55:36.100036Z", "loop": 1510, "env_steps": 927744000, "exact_value_avg": 0.4404680132865906, "regret_dist": 0.363309383392334, "regret_other_env": 0.6054680347442627, "regret_corner": 7.140189700294286e-05, "regret_row": 0.45690834522247314, "regret_any": 0.6054680347442627, "regret_bot": 0.7587085366249084, "value_dist": 0.4404680132865906, "value_other_env": 0.22408509254455566, "value_corner": 0.7650423645973206, "value_row": 0.33978068828582764, "value_any": 0.22408509254455566, "value_bot": 0.03798048198223114, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01510.png", "entropy": 0.08417382836341858} +{"ts": "2026-01-29T21:55:41.943057Z", "loop": 1515, "env_steps": 930816000, "exact_value_avg": 0.4418751001358032, "regret_dist": 0.36190226674079895, "regret_other_env": 0.6031452417373657, "regret_corner": 3.7799280107719824e-05, "regret_row": 0.4431654214859009, "regret_any": 0.6031452417373657, "regret_bot": 0.75874924659729, "value_dist": 0.4418751001358032, "value_other_env": 0.22640781104564667, "value_corner": 0.7650759816169739, "value_row": 0.3535236120223999, "value_any": 0.22640781104564667, "value_bot": 0.037939753383398056, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01515.png", "entropy": 0.08368492871522903} +{"ts": "2026-01-29T21:55:47.789671Z", "loop": 1520, "env_steps": 933888000, "exact_value_avg": 0.4450559914112091, "regret_dist": 0.35872140526771545, "regret_other_env": 0.5978603363037109, "regret_corner": 1.2965997484570835e-05, "regret_row": 0.4069846272468567, "regret_any": 0.5978603363037109, "regret_bot": 0.7595264315605164, "value_dist": 0.4450559914112091, "value_other_env": 0.23169277608394623, "value_corner": 0.7651007771492004, "value_row": 0.38970446586608887, "value_any": 0.23169277608394623, "value_bot": 0.03716259449720383, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01520.png", "entropy": 0.0941961258649826} +{"ts": "2026-01-29T21:55:53.640034Z", "loop": 1525, "env_steps": 936960000, "exact_value_avg": 0.4437490701675415, "regret_dist": 0.36002832651138306, "regret_other_env": 0.6000312566757202, "regret_corner": 2.3897986466181464e-05, "regret_row": 0.4020567834377289, "regret_any": 0.6000312566757202, "regret_bot": 0.7626938819885254, "value_dist": 0.4437490701675415, "value_other_env": 0.22952185571193695, "value_corner": 0.7650898098945618, "value_row": 0.3946322798728943, "value_any": 0.22952185571193695, "value_bot": 0.03399519994854927, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01525.png", "entropy": 0.10594509541988373} +{"ts": "2026-01-29T21:55:59.484157Z", "loop": 1530, "env_steps": 940032000, "exact_value_avg": 0.4450894296169281, "regret_dist": 0.35868796706199646, "regret_other_env": 0.5978027582168579, "regret_corner": 1.5685956896049902e-05, "regret_row": 0.4033668637275696, "regret_any": 0.5978027582168579, "regret_bot": 0.7606075406074524, "value_dist": 0.4450894296169281, "value_other_env": 0.23175033926963806, "value_corner": 0.7650980353355408, "value_row": 0.3933221995830536, "value_any": 0.23175033926963806, "value_bot": 0.03608150780200958, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01530.png", "entropy": 0.10012073069810867} +{"ts": "2026-01-29T21:56:05.327472Z", "loop": 1535, "env_steps": 943104000, "exact_value_avg": 0.445049524307251, "regret_dist": 0.3587278127670288, "regret_other_env": 0.5978691577911377, "regret_corner": 1.580864227435086e-05, "regret_row": 0.41037240624427795, "regret_any": 0.5978691577911377, "regret_bot": 0.7590243816375732, "value_dist": 0.445049524307251, "value_other_env": 0.23168392479419708, "value_corner": 0.765097975730896, "value_row": 0.3863166570663452, "value_any": 0.23168392479419708, "value_bot": 0.03766464442014694, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01535.png", "entropy": 0.08984581381082535} +{"ts": "2026-01-29T21:56:11.169912Z", "loop": 1540, "env_steps": 946176000, "exact_value_avg": 0.4413180351257324, "regret_dist": 0.36245933175086975, "regret_other_env": 0.6040215492248535, "regret_corner": 0.00011602094309637323, "regret_row": 0.4499271512031555, "regret_any": 0.6040215492248535, "regret_bot": 0.7586835026741028, "value_dist": 0.4413180351257324, "value_other_env": 0.22553156316280365, "value_corner": 0.764997661113739, "value_row": 0.3467618525028229, "value_any": 0.22553156316280365, "value_bot": 0.03800548240542412, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01540.png", "entropy": 0.08315938711166382} +{"ts": "2026-01-29T21:56:17.011325Z", "loop": 1545, "env_steps": 949248000, "exact_value_avg": 0.437187135219574, "regret_dist": 0.3665902018547058, "regret_other_env": 0.6105280518531799, "regret_corner": 0.000683389138430357, "regret_row": 0.4937208890914917, "regret_any": 0.6105280518531799, "regret_bot": 0.7586508989334106, "value_dist": 0.437187135219574, "value_other_env": 0.21902498602867126, "value_corner": 0.7644303441047668, "value_row": 0.30296817421913147, "value_any": 0.21902498602867126, "value_bot": 0.038038220256567, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01545.png", "entropy": 0.08247052133083344} +{"ts": "2026-01-29T21:56:22.852505Z", "loop": 1550, "env_steps": 952320000, "exact_value_avg": 0.44351011514663696, "regret_dist": 0.3602672219276428, "regret_other_env": 0.6003829836845398, "regret_corner": 9.36041324166581e-05, "regret_row": 0.4297884702682495, "regret_any": 0.6003829836845398, "regret_bot": 0.7587732076644897, "value_dist": 0.44351011514663696, "value_other_env": 0.22917009890079498, "value_corner": 0.7650201320648193, "value_row": 0.36690059304237366, "value_any": 0.22917009890079498, "value_bot": 0.03791585937142372, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01550.png", "entropy": 0.08822322636842728} +{"ts": "2026-01-29T21:56:28.701481Z", "loop": 1555, "env_steps": 955392000, "exact_value_avg": 0.44571709632873535, "regret_dist": 0.35806024074554443, "regret_other_env": 0.5967497229576111, "regret_corner": 2.599756044219248e-05, "regret_row": 0.40337708592414856, "regret_any": 0.5967497229576111, "regret_bot": 0.7602668404579163, "value_dist": 0.44571709632873535, "value_other_env": 0.2328033298254013, "value_corner": 0.7650876641273499, "value_row": 0.3933119773864746, "value_any": 0.2328033298254013, "value_bot": 0.03642221540212631, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01555.png", "entropy": 0.10620345920324326} +{"ts": "2026-01-29T21:56:34.550071Z", "loop": 1560, "env_steps": 958464000, "exact_value_avg": 0.4421249032020569, "regret_dist": 0.3616524338722229, "regret_other_env": 0.6026537418365479, "regret_corner": 0.00015046249609440565, "regret_row": 0.3920325040817261, "regret_any": 0.6026537418365479, "regret_bot": 0.7632922530174255, "value_dist": 0.4421249032020569, "value_other_env": 0.22689934074878693, "value_corner": 0.7649632692337036, "value_row": 0.4046564996242523, "value_any": 0.22689934074878693, "value_bot": 0.033396847546100616, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01560.png", "entropy": 0.12434791773557663} +{"ts": "2026-01-29T21:56:40.398552Z", "loop": 1565, "env_steps": 961536000, "exact_value_avg": 0.4445425271987915, "regret_dist": 0.3592347800731659, "regret_other_env": 0.598690927028656, "regret_corner": 5.054573557572439e-05, "regret_row": 0.3989178240299225, "regret_any": 0.598690927028656, "regret_bot": 0.7615930438041687, "value_dist": 0.4445425271987915, "value_other_env": 0.23086215555667877, "value_corner": 0.7650631070137024, "value_row": 0.3977712392807007, "value_any": 0.23086215555667877, "value_bot": 0.03509601205587387, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01565.png", "entropy": 0.11589596420526505} +{"ts": "2026-01-29T21:56:46.254840Z", "loop": 1570, "env_steps": 964608000, "exact_value_avg": 0.4458276927471161, "regret_dist": 0.3579496741294861, "regret_other_env": 0.5965575575828552, "regret_corner": 3.782709609367885e-05, "regret_row": 0.4094756841659546, "regret_any": 0.5965575575828552, "regret_bot": 0.7591302394866943, "value_dist": 0.4458276927471161, "value_other_env": 0.23299553990364075, "value_corner": 0.7650759220123291, "value_row": 0.3872133195400238, "value_any": 0.23299553990364075, "value_bot": 0.037558816373348236, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01570.png", "entropy": 0.09757673740386963} +{"ts": "2026-01-29T21:56:52.100644Z", "loop": 1575, "env_steps": 967680000, "exact_value_avg": 0.4445421099662781, "regret_dist": 0.3592352271080017, "regret_other_env": 0.5986720323562622, "regret_corner": 8.005351264728233e-05, "regret_row": 0.42181992530822754, "regret_any": 0.5986720323562622, "regret_bot": 0.7588323950767517, "value_dist": 0.4445421099662781, "value_other_env": 0.230881005525589, "value_corner": 0.7650337219238281, "value_row": 0.37486910820007324, "value_any": 0.230881005525589, "value_bot": 0.03785661607980728, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01575.png", "entropy": 0.09130201488733292} +{"ts": "2026-01-29T21:56:57.965584Z", "loop": 1580, "env_steps": 970752000, "exact_value_avg": 0.4461139142513275, "regret_dist": 0.35766348242759705, "regret_other_env": 0.596091091632843, "regret_corner": 2.2087991965236142e-05, "regret_row": 0.40637075901031494, "regret_any": 0.596091091632843, "regret_bot": 0.7592599987983704, "value_dist": 0.4461139142513275, "value_other_env": 0.23346205055713654, "value_corner": 0.7650916576385498, "value_row": 0.39031827449798584, "value_any": 0.23346205055713654, "value_bot": 0.03742901608347893, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01580.png", "entropy": 0.09467598050832748} +{"ts": "2026-01-29T21:57:03.819327Z", "loop": 1585, "env_steps": 973824000, "exact_value_avg": 0.4462716281414032, "regret_dist": 0.35750579833984375, "regret_other_env": 0.5958309173583984, "regret_corner": 1.807461194403004e-05, "regret_row": 0.40478450059890747, "regret_any": 0.5958309173583984, "regret_bot": 0.7594693303108215, "value_dist": 0.4462716281414032, "value_other_env": 0.23372222483158112, "value_corner": 0.7650957107543945, "value_row": 0.3919045925140381, "value_any": 0.23372222483158112, "value_bot": 0.037219684571027756, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01585.png", "entropy": 0.09396544843912125} +{"ts": "2026-01-29T21:57:09.674607Z", "loop": 1590, "env_steps": 976896000, "exact_value_avg": 0.4462689757347107, "regret_dist": 0.3575083911418915, "regret_other_env": 0.5958349704742432, "regret_corner": 1.8469991118763573e-05, "regret_row": 0.4023727774620056, "regret_any": 0.5958349704742432, "regret_bot": 0.7602400183677673, "value_dist": 0.4462689757347107, "value_other_env": 0.2337181270122528, "value_corner": 0.7650952935218811, "value_row": 0.39431628584861755, "value_any": 0.2337181270122528, "value_bot": 0.03644898161292076, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01590.png", "entropy": 0.09864103049039841} +{"ts": "2026-01-29T21:57:15.519868Z", "loop": 1595, "env_steps": 979968000, "exact_value_avg": 0.4464288651943207, "regret_dist": 0.3573484718799591, "regret_other_env": 0.5955693125724792, "regret_corner": 1.722325941955205e-05, "regret_row": 0.402743935585022, "regret_any": 0.5955693125724792, "regret_bot": 0.759946882724762, "value_dist": 0.4464288651943207, "value_other_env": 0.23398378491401672, "value_corner": 0.7650964856147766, "value_row": 0.3939451277256012, "value_any": 0.23398378491401672, "value_bot": 0.03674215450882912, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01595.png", "entropy": 0.09640919417142868} +{"ts": "2026-01-29T21:57:21.374359Z", "loop": 1600, "env_steps": 983040000, "exact_value_avg": 0.44646644592285156, "regret_dist": 0.357310950756073, "regret_other_env": 0.5955061912536621, "regret_corner": 1.8010041458182968e-05, "regret_row": 0.4022151529788971, "regret_any": 0.5955061912536621, "regret_bot": 0.7602154612541199, "value_dist": 0.44646644592285156, "value_other_env": 0.23404687643051147, "value_corner": 0.7650957703590393, "value_row": 0.3944739103317261, "value_any": 0.23404687643051147, "value_bot": 0.036473583430051804, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01600.png", "entropy": 0.09657220542430878} +{"ts": "2026-01-29T21:57:27.217025Z", "loop": 1605, "env_steps": 986112000, "exact_value_avg": 0.44346556067466736, "regret_dist": 0.3603118360042572, "regret_other_env": 0.6004896759986877, "regret_corner": 4.508545316639356e-05, "regret_row": 0.3943943679332733, "regret_any": 0.6004896759986877, "regret_bot": 0.7641122341156006, "value_dist": 0.44346556067466736, "value_other_env": 0.2290634661912918, "value_corner": 0.7650686502456665, "value_row": 0.40229466557502747, "value_any": 0.2290634661912918, "value_bot": 0.0325767956674099, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01605.png", "entropy": 0.10728591680526733} +{"ts": "2026-01-29T21:57:33.064319Z", "loop": 1610, "env_steps": 989184000, "exact_value_avg": 0.4445902109146118, "regret_dist": 0.35918718576431274, "regret_other_env": 0.5986284017562866, "regret_corner": 2.5352339434903115e-05, "regret_row": 0.39820241928100586, "regret_any": 0.5986284017562866, "regret_bot": 0.7635495662689209, "value_dist": 0.4445902109146118, "value_other_env": 0.23092474043369293, "value_corner": 0.7650883793830872, "value_row": 0.3984866440296173, "value_any": 0.23092474043369293, "value_bot": 0.03313944488763809, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01610.png", "entropy": 0.10075165331363678} +{"ts": "2026-01-29T21:57:38.908083Z", "loop": 1615, "env_steps": 992256000, "exact_value_avg": 0.44545120000839233, "regret_dist": 0.35832616686820984, "regret_other_env": 0.5972046852111816, "regret_corner": 8.345147762156557e-06, "regret_row": 0.41095954179763794, "regret_any": 0.5972046852111816, "regret_bot": 0.7589156627655029, "value_dist": 0.44545120000839233, "value_other_env": 0.23234841227531433, "value_corner": 0.7651054263114929, "value_row": 0.38572949171066284, "value_any": 0.23234841227531433, "value_bot": 0.037773460149765015, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01615.png", "entropy": 0.07642515748739243} +{"ts": "2026-01-29T21:57:44.756512Z", "loop": 1620, "env_steps": 995328000, "exact_value_avg": 0.4436112344264984, "regret_dist": 0.36016613245010376, "regret_other_env": 0.6002678275108337, "regret_corner": 1.3551613847084809e-05, "regret_row": 0.4302448630332947, "regret_any": 0.6002678275108337, "regret_bot": 0.7587108016014099, "value_dist": 0.4436112344264984, "value_other_env": 0.22928525507450104, "value_corner": 0.7651001811027527, "value_row": 0.3664442300796509, "value_any": 0.22928525507450104, "value_bot": 0.03797823563218117, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01620.png", "entropy": 0.07110713422298431} +{"ts": "2026-01-29T21:57:50.599853Z", "loop": 1625, "env_steps": 998400000, "exact_value_avg": 0.44446322321891785, "regret_dist": 0.35931411385536194, "regret_other_env": 0.5988501906394958, "regret_corner": 1.0012090569944121e-05, "regret_row": 0.4212440252304077, "regret_any": 0.5988501906394958, "regret_bot": 0.758756160736084, "value_dist": 0.44446322321891785, "value_other_env": 0.23070290684700012, "value_corner": 0.7651036977767944, "value_row": 0.37544506788253784, "value_any": 0.23070290684700012, "value_bot": 0.0379328615963459, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01625.png", "entropy": 0.0722079873085022} +{"ts": "2026-01-29T21:57:56.444540Z", "loop": 1630, "env_steps": 1001472000, "exact_value_avg": 0.44558969140052795, "regret_dist": 0.3581876754760742, "regret_other_env": 0.5969730615615845, "regret_corner": 9.510915333521552e-06, "regret_row": 0.410484254360199, "regret_any": 0.5969730615615845, "regret_bot": 0.758881688117981, "value_dist": 0.44558969140052795, "value_other_env": 0.2325800061225891, "value_corner": 0.7651042342185974, "value_row": 0.3862047791481018, "value_any": 0.2325800061225891, "value_bot": 0.0378074087202549, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01630.png", "entropy": 0.07620091736316681} +{"ts": "2026-01-29T21:58:02.292961Z", "loop": 1635, "env_steps": 1004544000, "exact_value_avg": 0.4461977779865265, "regret_dist": 0.35757964849472046, "regret_other_env": 0.5959586501121521, "regret_corner": 1.1123717740701977e-05, "regret_row": 0.4065413475036621, "regret_any": 0.5959586501121521, "regret_bot": 0.7590265870094299, "value_dist": 0.4461977779865265, "value_other_env": 0.23359446227550507, "value_corner": 0.7651026844978333, "value_row": 0.39014771580696106, "value_any": 0.23359446227550507, "value_bot": 0.03766241297125816, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01635.png", "entropy": 0.08032503724098206} +{"ts": "2026-01-29T21:58:08.136295Z", "loop": 1640, "env_steps": 1007616000, "exact_value_avg": 0.4469867944717407, "regret_dist": 0.35679054260253906, "regret_other_env": 0.5946406126022339, "regret_corner": 1.545250415802002e-05, "regret_row": 0.40079382061958313, "regret_any": 0.5946406126022339, "regret_bot": 0.7602266669273376, "value_dist": 0.4469867944717407, "value_other_env": 0.2349124699831009, "value_corner": 0.7650982737541199, "value_row": 0.3958952724933624, "value_any": 0.2349124699831009, "value_bot": 0.03646242991089821, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01640.png", "entropy": 0.09123510867357254} +{"ts": "2026-01-29T21:58:13.981486Z", "loop": 1645, "env_steps": 1010688000, "exact_value_avg": 0.4469863474369049, "regret_dist": 0.35679104924201965, "regret_other_env": 0.5946399569511414, "regret_corner": 1.768469883245416e-05, "regret_row": 0.39933282136917114, "regret_any": 0.5946399569511414, "regret_bot": 0.7608510255813599, "value_dist": 0.4469863474369049, "value_other_env": 0.234913170337677, "value_corner": 0.7650960683822632, "value_row": 0.397356241941452, "value_any": 0.234913170337677, "value_bot": 0.035838089883327484, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01645.png", "entropy": 0.09339694678783417} +{"ts": "2026-01-29T21:58:19.837432Z", "loop": 1650, "env_steps": 1013760000, "exact_value_avg": 0.4469852149486542, "regret_dist": 0.3567921817302704, "regret_other_env": 0.5946430563926697, "regret_corner": 1.5864770830376074e-05, "regret_row": 0.40375426411628723, "regret_any": 0.5946430563926697, "regret_bot": 0.7593748569488525, "value_dist": 0.4469852149486542, "value_other_env": 0.23491008579730988, "value_corner": 0.7650978565216064, "value_row": 0.39293479919433594, "value_any": 0.23491008579730988, "value_bot": 0.03731418773531914, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01650.png", "entropy": 0.08508435636758804} +{"ts": "2026-01-29T21:58:25.686959Z", "loop": 1655, "env_steps": 1016832000, "exact_value_avg": 0.441835880279541, "regret_dist": 0.36194145679473877, "regret_other_env": 0.60308837890625, "regret_corner": 0.00022109052224550396, "regret_row": 0.45429742336273193, "regret_any": 0.60308837890625, "regret_bot": 0.7586724162101746, "value_dist": 0.441835880279541, "value_other_env": 0.22646473348140717, "value_corner": 0.7648926377296448, "value_row": 0.3423916697502136, "value_any": 0.22646473348140717, "value_bot": 0.03801662474870682, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01655.png", "entropy": 0.07893604785203934} +{"ts": "2026-01-29T21:58:31.541684Z", "loop": 1660, "env_steps": 1019904000, "exact_value_avg": 0.44632774591445923, "regret_dist": 0.35744959115982056, "regret_other_env": 0.5957324504852295, "regret_corner": 2.5227171136066318e-05, "regret_row": 0.4106943607330322, "regret_any": 0.5957324504852295, "regret_bot": 0.7588927745819092, "value_dist": 0.44632774591445923, "value_other_env": 0.2338205873966217, "value_corner": 0.7650884985923767, "value_row": 0.38599467277526855, "value_any": 0.2338205873966217, "value_bot": 0.03779618814587593, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01660.png", "entropy": 0.08338556438684464} +{"ts": "2026-01-29T21:58:37.391034Z", "loop": 1665, "env_steps": 1022976000, "exact_value_avg": 0.4475065767765045, "regret_dist": 0.35627079010009766, "regret_other_env": 0.5937578082084656, "regret_corner": 4.026740862173028e-05, "regret_row": 0.391405314207077, "regret_any": 0.5937578082084656, "regret_bot": 0.761310338973999, "value_dist": 0.4475065767765045, "value_other_env": 0.235795259475708, "value_corner": 0.7650734782218933, "value_row": 0.40528377890586853, "value_any": 0.235795259475708, "value_bot": 0.035378679633140564, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01665.png", "entropy": 0.10286853462457657} +{"ts": "2026-01-29T21:58:43.235739Z", "loop": 1670, "env_steps": 1026048000, "exact_value_avg": 0.4473768472671509, "regret_dist": 0.3564004898071289, "regret_other_env": 0.5939732193946838, "regret_corner": 4.133334005018696e-05, "regret_row": 0.39059725403785706, "regret_any": 0.5939732193946838, "regret_bot": 0.7617915272712708, "value_dist": 0.4473768472671509, "value_other_env": 0.23557983338832855, "value_corner": 0.7650724053382874, "value_row": 0.4060918390750885, "value_any": 0.23557983338832855, "value_bot": 0.034897491335868835, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01670.png", "entropy": 0.10239941626787186} +{"ts": "2026-01-29T21:58:49.081215Z", "loop": 1675, "env_steps": 1029120000, "exact_value_avg": 0.4473697543144226, "regret_dist": 0.35640764236450195, "regret_other_env": 0.5939943194389343, "regret_corner": 2.7593474442255683e-05, "regret_row": 0.39285412430763245, "regret_any": 0.5939943194389343, "regret_bot": 0.7616180777549744, "value_dist": 0.4473697543144226, "value_other_env": 0.23555879294872284, "value_corner": 0.7650861740112305, "value_row": 0.4038349390029907, "value_any": 0.23555879294872284, "value_bot": 0.03507097810506821, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01675.png", "entropy": 0.09604351222515106} +{"ts": "2026-01-29T21:58:54.923920Z", "loop": 1680, "env_steps": 1032192000, "exact_value_avg": 0.4472976326942444, "regret_dist": 0.3564797341823578, "regret_other_env": 0.594110906124115, "regret_corner": 3.289630330982618e-05, "regret_row": 0.3903314769268036, "regret_any": 0.594110906124115, "regret_bot": 0.762086033821106, "value_dist": 0.4472976326942444, "value_other_env": 0.235442116856575, "value_corner": 0.7650808691978455, "value_row": 0.40635761618614197, "value_any": 0.235442116856575, "value_bot": 0.03460300341248512, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01680.png", "entropy": 0.09720059484243393} +{"ts": "2026-01-29T21:59:00.771163Z", "loop": 1685, "env_steps": 1035264000, "exact_value_avg": 0.4469503164291382, "regret_dist": 0.3568269908428192, "regret_other_env": 0.5946776270866394, "regret_corner": 5.106429671286605e-05, "regret_row": 0.3871627151966095, "regret_any": 0.5946776270866394, "regret_bot": 0.762695848941803, "value_dist": 0.4469503164291382, "value_other_env": 0.23487542569637299, "value_corner": 0.7650626301765442, "value_row": 0.4095263183116913, "value_any": 0.23487542569637299, "value_bot": 0.0339931957423687, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01685.png", "entropy": 0.10057634115219116} +{"ts": "2026-01-29T21:59:06.623072Z", "loop": 1690, "env_steps": 1038336000, "exact_value_avg": 0.4398917257785797, "regret_dist": 0.36388567090034485, "regret_other_env": 0.6056234836578369, "regret_corner": 0.0012788837775588036, "regret_row": 0.378583163022995, "regret_any": 0.6056234836578369, "regret_bot": 0.7671611905097961, "value_dist": 0.4398917257785797, "value_other_env": 0.22392956912517548, "value_corner": 0.7638349533081055, "value_row": 0.4181058704853058, "value_any": 0.22392956912517548, "value_bot": 0.02952784299850464, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01690.png", "entropy": 0.11822815239429474} +{"ts": "2026-01-29T21:59:12.476710Z", "loop": 1695, "env_steps": 1041408000, "exact_value_avg": 0.4477863311767578, "regret_dist": 0.35599103569984436, "regret_other_env": 0.593295156955719, "regret_corner": 3.478875078144483e-05, "regret_row": 0.38836470246315, "regret_any": 0.593295156955719, "regret_bot": 0.7614073753356934, "value_dist": 0.4477863311767578, "value_other_env": 0.2362579107284546, "value_corner": 0.7650789618492126, "value_row": 0.40832436084747314, "value_any": 0.2362579107284546, "value_bot": 0.03528163209557533, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01695.png", "entropy": 0.09409641474485397} +{"ts": "2026-01-29T21:59:18.325912Z", "loop": 1700, "env_steps": 1044480000, "exact_value_avg": 0.4475817084312439, "regret_dist": 0.3561956286430359, "regret_other_env": 0.5936530232429504, "regret_corner": 9.52829941525124e-06, "regret_row": 0.40159425139427185, "regret_any": 0.5936530232429504, "regret_bot": 0.7590455412864685, "value_dist": 0.4475817084312439, "value_other_env": 0.23590001463890076, "value_corner": 0.7651042342185974, "value_row": 0.39509478211402893, "value_any": 0.23590001463890076, "value_bot": 0.037643514573574066, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01700.png", "entropy": 0.07805044203996658} +{"ts": "2026-01-29T21:59:24.175108Z", "loop": 1705, "env_steps": 1047552000, "exact_value_avg": 0.44668513536453247, "regret_dist": 0.3570922911167145, "regret_other_env": 0.5951437950134277, "regret_corner": 1.4949839169275947e-05, "regret_row": 0.4080345630645752, "regret_any": 0.5951437950134277, "regret_bot": 0.7587703466415405, "value_dist": 0.44668513536453247, "value_other_env": 0.23440934717655182, "value_corner": 0.7650988101959229, "value_row": 0.3886544704437256, "value_any": 0.23440934717655182, "value_bot": 0.03791869431734085, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01705.png", "entropy": 0.07540421932935715} +{"ts": "2026-01-29T21:59:30.021731Z", "loop": 1710, "env_steps": 1050624000, "exact_value_avg": 0.4459403157234192, "regret_dist": 0.3578370213508606, "regret_other_env": 0.5963727235794067, "regret_corner": 3.342529453220777e-05, "regret_row": 0.4139752686023712, "regret_any": 0.5963727235794067, "regret_bot": 0.7587153315544128, "value_dist": 0.4459403157234192, "value_other_env": 0.23318032920360565, "value_corner": 0.7650802731513977, "value_row": 0.38271376490592957, "value_any": 0.23318032920360565, "value_bot": 0.03797367587685585, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01710.png", "entropy": 0.07653677463531494} +{"ts": "2026-01-29T21:59:35.865703Z", "loop": 1715, "env_steps": 1053696000, "exact_value_avg": 0.4465717077255249, "regret_dist": 0.35720571875572205, "regret_other_env": 0.5953193306922913, "regret_corner": 3.52571441908367e-05, "regret_row": 0.4103538691997528, "regret_any": 0.5953193306922913, "regret_bot": 0.758791446685791, "value_dist": 0.4465717077255249, "value_other_env": 0.2342337667942047, "value_corner": 0.7650785446166992, "value_row": 0.38633519411087036, "value_any": 0.2342337667942047, "value_bot": 0.037897542119026184, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01715.png", "entropy": 0.07978053390979767} +{"ts": "2026-01-29T21:59:41.721662Z", "loop": 1720, "env_steps": 1056768000, "exact_value_avg": 0.4476061463356018, "regret_dist": 0.35617125034332275, "regret_other_env": 0.5936060547828674, "regret_corner": 1.8995007849298418e-05, "regret_row": 0.40343835949897766, "regret_any": 0.5936060547828674, "regret_bot": 0.7590356469154358, "value_dist": 0.4476061463356018, "value_other_env": 0.23594708740711212, "value_corner": 0.7650947570800781, "value_row": 0.3932507336139679, "value_any": 0.23594708740711212, "value_bot": 0.037653371691703796, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01720.png", "entropy": 0.08168623596429825} +{"ts": "2026-01-29T21:59:47.579147Z", "loop": 1725, "env_steps": 1059840000, "exact_value_avg": 0.4469950497150421, "regret_dist": 0.35678234696388245, "regret_other_env": 0.5946153998374939, "regret_corner": 3.271699097240344e-05, "regret_row": 0.40920379757881165, "regret_any": 0.5946153998374939, "regret_bot": 0.7588911056518555, "value_dist": 0.4469950497150421, "value_other_env": 0.23493771255016327, "value_corner": 0.7650810480117798, "value_row": 0.38748523592948914, "value_any": 0.23493771255016327, "value_bot": 0.03779793158173561, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01725.png", "entropy": 0.08276735991239548} +{"ts": "2026-01-29T21:59:53.425912Z", "loop": 1730, "env_steps": 1062912000, "exact_value_avg": 0.4479999244213104, "regret_dist": 0.35577747225761414, "regret_other_env": 0.5929431915283203, "regret_corner": 2.883921297325287e-05, "regret_row": 0.40223008394241333, "regret_any": 0.5929431915283203, "regret_bot": 0.7591435313224792, "value_dist": 0.4479999244213104, "value_other_env": 0.23660992085933685, "value_corner": 0.7650849223136902, "value_row": 0.39445897936820984, "value_any": 0.23660992085933685, "value_bot": 0.037545498460531235, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01730.png", "entropy": 0.08789939433336258} +{"ts": "2026-01-29T21:59:59.268954Z", "loop": 1735, "env_steps": 1065984000, "exact_value_avg": 0.44859403371810913, "regret_dist": 0.35518333315849304, "regret_other_env": 0.5919491648674011, "regret_corner": 3.4588578273542225e-05, "regret_row": 0.3982263505458832, "regret_any": 0.5919491648674011, "regret_bot": 0.759360671043396, "value_dist": 0.44859403371810913, "value_other_env": 0.23760393261909485, "value_corner": 0.765079140663147, "value_row": 0.3984627425670624, "value_any": 0.23760393261909485, "value_bot": 0.03732837364077568, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01735.png", "entropy": 0.09303630888462067} +{"ts": "2026-01-29T22:00:05.110745Z", "loop": 1740, "env_steps": 1069056000, "exact_value_avg": 0.44928497076034546, "regret_dist": 0.3544923961162567, "regret_other_env": 0.5907837748527527, "regret_corner": 5.526592576643452e-05, "regret_row": 0.3931030035018921, "regret_any": 0.5907837748527527, "regret_bot": 0.759877622127533, "value_dist": 0.44928497076034546, "value_other_env": 0.2387693077325821, "value_corner": 0.7650584578514099, "value_row": 0.4035860300064087, "value_any": 0.2387693077325821, "value_bot": 0.03681141883134842, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01740.png", "entropy": 0.10313766449689865} +{"ts": "2026-01-29T22:00:10.953766Z", "loop": 1745, "env_steps": 1072128000, "exact_value_avg": 0.4496985971927643, "regret_dist": 0.35407882928848267, "regret_other_env": 0.5900164246559143, "regret_corner": 0.00017237316933460534, "regret_row": 0.382457435131073, "regret_any": 0.5900164246559143, "regret_bot": 0.7613021731376648, "value_dist": 0.4496985971927643, "value_other_env": 0.23953670263290405, "value_corner": 0.764941394329071, "value_row": 0.41423162817955017, "value_any": 0.23953670263290405, "value_bot": 0.03538687154650688, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01745.png", "entropy": 0.12547317147254944} +{"ts": "2026-01-29T22:00:16.799712Z", "loop": 1750, "env_steps": 1075200000, "exact_value_avg": 0.43934935331344604, "regret_dist": 0.36442801356315613, "regret_other_env": 0.6007125377655029, "regret_corner": 0.010001189075410366, "regret_row": 0.3706604838371277, "regret_any": 0.6007125377655029, "regret_bot": 0.7654693722724915, "value_dist": 0.43934935331344604, "value_other_env": 0.22884051501750946, "value_corner": 0.7551125884056091, "value_row": 0.4260285794734955, "value_any": 0.22884051501750946, "value_bot": 0.031219692900776863, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01750.png", "entropy": 0.1801324039697647} +{"ts": "2026-01-29T22:00:22.645164Z", "loop": 1755, "env_steps": 1078272000, "exact_value_avg": 0.44940242171287537, "regret_dist": 0.3543749153614044, "regret_other_env": 0.5904456973075867, "regret_corner": 0.00026870620786212385, "regret_row": 0.3775803744792938, "regret_any": 0.5904456973075867, "regret_bot": 0.7618756890296936, "value_dist": 0.44940242171287537, "value_other_env": 0.23910731077194214, "value_corner": 0.764845073223114, "value_row": 0.41910865902900696, "value_any": 0.23910731077194214, "value_bot": 0.034813400357961655, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01755.png", "entropy": 0.1289266049861908} +{"ts": "2026-01-29T22:00:28.496766Z", "loop": 1760, "env_steps": 1081344000, "exact_value_avg": 0.44808951020240784, "regret_dist": 0.35568782687187195, "regret_other_env": 0.5927708745002747, "regret_corner": 6.324698915705085e-05, "regret_row": 0.4040640592575073, "regret_any": 0.5927708745002747, "regret_bot": 0.7591175436973572, "value_dist": 0.44808951020240784, "value_other_env": 0.23678217828273773, "value_corner": 0.76505047082901, "value_row": 0.39262500405311584, "value_any": 0.23678217828273773, "value_bot": 0.03757154196500778, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01760.png", "entropy": 0.0922825038433075} +{"ts": "2026-01-29T22:00:34.347347Z", "loop": 1765, "env_steps": 1084416000, "exact_value_avg": 0.4466678500175476, "regret_dist": 0.35710951685905457, "regret_other_env": 0.5951118469238281, "regret_corner": 0.0001060058712027967, "regret_row": 0.41682496666908264, "regret_any": 0.5951118469238281, "regret_bot": 0.7588561773300171, "value_dist": 0.4466678500175476, "value_other_env": 0.23444129526615143, "value_corner": 0.7650076746940613, "value_row": 0.3798640966415405, "value_any": 0.23444129526615143, "value_bot": 0.037832848727703094, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01765.png", "entropy": 0.08791031688451767} +{"ts": "2026-01-29T22:00:40.197916Z", "loop": 1770, "env_steps": 1087488000, "exact_value_avg": 0.4499657452106476, "regret_dist": 0.353811651468277, "regret_other_env": 0.5896584391593933, "regret_corner": 4.14485766668804e-05, "regret_row": 0.3864940404891968, "regret_any": 0.5896584391593933, "regret_bot": 0.7604907155036926, "value_dist": 0.4499657452106476, "value_other_env": 0.23989467322826385, "value_corner": 0.7650722861289978, "value_row": 0.410194993019104, "value_any": 0.23989467322826385, "value_bot": 0.03619832172989845, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01770.png", "entropy": 0.09698723256587982} +{"ts": "2026-01-29T22:00:46.048343Z", "loop": 1775, "env_steps": 1090560000, "exact_value_avg": 0.44811105728149414, "regret_dist": 0.35566630959510803, "regret_other_env": 0.5925557017326355, "regret_corner": 0.0003322094853501767, "regret_row": 0.3723885118961334, "regret_any": 0.5925557017326355, "regret_bot": 0.7628180980682373, "value_dist": 0.44811105728149414, "value_other_env": 0.23699742555618286, "value_corner": 0.7647815346717834, "value_row": 0.42430052161216736, "value_any": 0.23699742555618286, "value_bot": 0.03387096896767616, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01775.png", "entropy": 0.11601350456476212} +{"ts": "2026-01-29T22:00:51.895591Z", "loop": 1780, "env_steps": 1093632000, "exact_value_avg": 0.4493538737297058, "regret_dist": 0.35442355275154114, "regret_other_env": 0.5906939506530762, "regret_corner": 1.7926098735188134e-05, "regret_row": 0.3925861120223999, "regret_any": 0.5906939506530762, "regret_bot": 0.7594578266143799, "value_dist": 0.4493538737297058, "value_other_env": 0.238859161734581, "value_corner": 0.7650958299636841, "value_row": 0.40410295128822327, "value_any": 0.238859161734581, "value_bot": 0.0372312031686306, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01780.png", "entropy": 0.08352754265069962} +{"ts": "2026-01-29T22:00:57.740314Z", "loop": 1785, "env_steps": 1096704000, "exact_value_avg": 0.4459601938724518, "regret_dist": 0.357817143201828, "regret_other_env": 0.5963325500488281, "regret_corner": 4.4057273044018075e-05, "regret_row": 0.422494500875473, "regret_any": 0.5963325500488281, "regret_bot": 0.7587183117866516, "value_dist": 0.4459601938724518, "value_other_env": 0.23322054743766785, "value_corner": 0.7650696039199829, "value_row": 0.37419456243515015, "value_any": 0.23322054743766785, "value_bot": 0.03797077760100365, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01785.png", "entropy": 0.07704135030508041} +{"ts": "2026-01-29T22:01:03.585771Z", "loop": 1790, "env_steps": 1099776000, "exact_value_avg": 0.4467361867427826, "regret_dist": 0.3570411801338196, "regret_other_env": 0.5950503349304199, "regret_corner": 2.7419628167990595e-05, "regret_row": 0.41588106751441956, "regret_any": 0.5950503349304199, "regret_bot": 0.7587529420852661, "value_dist": 0.4467361867427826, "value_other_env": 0.23450273275375366, "value_corner": 0.76508629322052, "value_row": 0.380808025598526, "value_any": 0.23450273275375366, "value_bot": 0.03793611750006676, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01790.png", "entropy": 0.0766235813498497} +{"ts": "2026-01-29T22:01:09.430958Z", "loop": 1795, "env_steps": 1102848000, "exact_value_avg": 0.44898277521133423, "regret_dist": 0.35479459166526794, "regret_other_env": 0.5913127660751343, "regret_corner": 1.72600157384295e-05, "regret_row": 0.39664435386657715, "regret_any": 0.5913127660751343, "regret_bot": 0.7591118812561035, "value_dist": 0.44898277521133423, "value_other_env": 0.23824027180671692, "value_corner": 0.7650964260101318, "value_row": 0.400044709444046, "value_any": 0.23824027180671692, "value_bot": 0.03757719323039055, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01795.png", "entropy": 0.08029205352067947} +{"ts": "2026-01-29T22:01:15.282568Z", "loop": 1800, "env_steps": 1105920000, "exact_value_avg": 0.44896769523620605, "regret_dist": 0.3548096716403961, "regret_other_env": 0.5913331508636475, "regret_corner": 2.4404625946772285e-05, "regret_row": 0.39872047305107117, "regret_any": 0.5913331508636475, "regret_bot": 0.7590543627738953, "value_dist": 0.44896769523620605, "value_other_env": 0.23821991682052612, "value_corner": 0.7650893330574036, "value_row": 0.397968590259552, "value_any": 0.23821991682052612, "value_bot": 0.03763464465737343, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01800.png", "entropy": 0.08383078128099442} +{"ts": "2026-01-29T22:01:21.133724Z", "loop": 1805, "env_steps": 1108992000, "exact_value_avg": 0.4501238465309143, "regret_dist": 0.35365352034568787, "regret_other_env": 0.5894030332565308, "regret_corner": 2.9188893677201122e-05, "regret_row": 0.38941866159439087, "regret_any": 0.5894030332565308, "regret_bot": 0.7596026659011841, "value_dist": 0.4501238465309143, "value_other_env": 0.24015004932880402, "value_corner": 0.7650845646858215, "value_row": 0.4072703719139099, "value_any": 0.24015004932880402, "value_bot": 0.03708641231060028, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01805.png", "entropy": 0.08948618173599243} +{"ts": "2026-01-29T22:01:26.974438Z", "loop": 1810, "env_steps": 1112064000, "exact_value_avg": 0.4486146867275238, "regret_dist": 0.35516270995140076, "regret_other_env": 0.5916552543640137, "regret_corner": 0.00042388690053485334, "regret_row": 0.36977532505989075, "regret_any": 0.5916552543640137, "regret_bot": 0.7626248002052307, "value_dist": 0.4486146867275238, "value_other_env": 0.2378978729248047, "value_corner": 0.7646898627281189, "value_row": 0.42691370844841003, "value_any": 0.2378978729248047, "value_bot": 0.03406422212719917, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01810.png", "entropy": 0.12044728547334671} +{"ts": "2026-01-29T22:01:32.823220Z", "loop": 1815, "env_steps": 1115136000, "exact_value_avg": 0.45037078857421875, "regret_dist": 0.3534066081047058, "regret_other_env": 0.5889685153961182, "regret_corner": 6.367763126036152e-05, "regret_row": 0.3740524649620056, "regret_any": 0.5889685153961182, "regret_bot": 0.7616105079650879, "value_dist": 0.45037078857421875, "value_other_env": 0.2405846267938614, "value_corner": 0.7650500535964966, "value_row": 0.4226365387439728, "value_any": 0.2405846267938614, "value_bot": 0.035078518092632294, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01815.png", "entropy": 0.09933093935251236} +{"ts": "2026-01-29T22:01:38.670701Z", "loop": 1820, "env_steps": 1118208000, "exact_value_avg": 0.45027339458465576, "regret_dist": 0.3535040020942688, "regret_other_env": 0.5891584157943726, "regret_corner": 2.233982195321005e-05, "regret_row": 0.3836200535297394, "regret_any": 0.5891584157943726, "regret_bot": 0.7605268955230713, "value_dist": 0.45027339458465576, "value_other_env": 0.2403946816921234, "value_corner": 0.7650913596153259, "value_row": 0.4130690097808838, "value_any": 0.2403946816921234, "value_bot": 0.036162108182907104, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01820.png", "entropy": 0.08517665416002274} +{"ts": "2026-01-29T22:01:44.519698Z", "loop": 1825, "env_steps": 1121280000, "exact_value_avg": 0.4496920108795166, "regret_dist": 0.3540852963924408, "regret_other_env": 0.5901336669921875, "regret_corner": 1.2749930647260044e-05, "regret_row": 0.39043816924095154, "regret_any": 0.5901336669921875, "regret_bot": 0.7593288421630859, "value_dist": 0.4496920108795166, "value_other_env": 0.23941941559314728, "value_corner": 0.7651009559631348, "value_row": 0.40625080466270447, "value_any": 0.23941941559314728, "value_bot": 0.03736024349927902, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01825.png", "entropy": 0.07708054780960083} +{"ts": "2026-01-29T22:01:50.360688Z", "loop": 1830, "env_steps": 1124352000, "exact_value_avg": 0.45020270347595215, "regret_dist": 0.3535746932029724, "regret_other_env": 0.589277982711792, "regret_corner": 1.9780796719715e-05, "regret_row": 0.3843030333518982, "regret_any": 0.589277982711792, "regret_bot": 0.7604020237922668, "value_dist": 0.45020270347595215, "value_other_env": 0.24027512967586517, "value_corner": 0.765093982219696, "value_row": 0.4123860001564026, "value_any": 0.24027512967586517, "value_bot": 0.036287084221839905, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01830.png", "entropy": 0.0832216665148735} +{"ts": "2026-01-29T22:01:56.208078Z", "loop": 1835, "env_steps": 1127424000, "exact_value_avg": 0.45044392347335815, "regret_dist": 0.3533335030078888, "regret_other_env": 0.5888704657554626, "regret_corner": 2.798189780151006e-05, "regret_row": 0.3794066309928894, "regret_any": 0.5888704657554626, "regret_bot": 0.7610339522361755, "value_dist": 0.45044392347335815, "value_other_env": 0.2406827211380005, "value_corner": 0.765085756778717, "value_row": 0.41728246212005615, "value_any": 0.2406827211380005, "value_bot": 0.03565508499741554, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01835.png", "entropy": 0.08838104456663132} +{"ts": "2026-01-29T22:02:02.061498Z", "loop": 1840, "env_steps": 1130496000, "exact_value_avg": 0.45043033361434937, "regret_dist": 0.3533470034599304, "regret_other_env": 0.5888986587524414, "regret_corner": 1.9516051906975918e-05, "regret_row": 0.38382163643836975, "regret_any": 0.5888986587524414, "regret_bot": 0.7602267265319824, "value_dist": 0.45043033361434937, "value_other_env": 0.2406543642282486, "value_corner": 0.7650942206382751, "value_row": 0.41286739706993103, "value_any": 0.2406543642282486, "value_bot": 0.03646231070160866, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01840.png", "entropy": 0.08295942097902298} +{"ts": "2026-01-29T22:02:07.906222Z", "loop": 1845, "env_steps": 1133568000, "exact_value_avg": 0.4495755434036255, "regret_dist": 0.3542018234729767, "regret_other_env": 0.5903278589248657, "regret_corner": 1.2708704161923379e-05, "regret_row": 0.3930564522743225, "regret_any": 0.5903278589248657, "regret_bot": 0.7591328620910645, "value_dist": 0.4495755434036255, "value_other_env": 0.23922523856163025, "value_corner": 0.7651010155677795, "value_row": 0.40363261103630066, "value_any": 0.23922523856163025, "value_bot": 0.03755620867013931, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01845.png", "entropy": 0.07638575881719589} +{"ts": "2026-01-29T22:02:13.748729Z", "loop": 1850, "env_steps": 1136640000, "exact_value_avg": 0.4494500756263733, "regret_dist": 0.35432732105255127, "regret_other_env": 0.5905367732048035, "regret_corner": 1.3101102013024502e-05, "regret_row": 0.39504602551460266, "regret_any": 0.5905367732048035, "regret_bot": 0.759052574634552, "value_dist": 0.4494500756263733, "value_other_env": 0.2390163391828537, "value_corner": 0.7651006579399109, "value_row": 0.4016430377960205, "value_any": 0.2390163391828537, "value_bot": 0.03763642534613609, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01850.png", "entropy": 0.07635416090488434} +{"ts": "2026-01-29T22:02:19.591986Z", "loop": 1855, "env_steps": 1139712000, "exact_value_avg": 0.4508037865161896, "regret_dist": 0.3529735505580902, "regret_other_env": 0.5882740020751953, "regret_corner": 2.2905072910361923e-05, "regret_row": 0.37985995411872864, "regret_any": 0.5882740020751953, "regret_bot": 0.7604748010635376, "value_dist": 0.4508037865161896, "value_other_env": 0.24127903580665588, "value_corner": 0.7650908827781677, "value_row": 0.41682907938957214, "value_any": 0.24127903580665588, "value_bot": 0.03621428459882736, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01855.png", "entropy": 0.08462425321340561} +{"ts": "2026-01-29T22:02:25.441525Z", "loop": 1860, "env_steps": 1142784000, "exact_value_avg": 0.4500617980957031, "regret_dist": 0.3537156283855438, "regret_other_env": 0.5894649624824524, "regret_corner": 9.15606869966723e-05, "regret_row": 0.3695280849933624, "regret_any": 0.5894649624824524, "regret_bot": 0.7628466486930847, "value_dist": 0.4500617980957031, "value_other_env": 0.24008813500404358, "value_corner": 0.7650222182273865, "value_row": 0.42716100811958313, "value_any": 0.24008813500404358, "value_bot": 0.03384235501289368, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01860.png", "entropy": 0.1052272617816925} +{"ts": "2026-01-29T22:02:31.286326Z", "loop": 1865, "env_steps": 1145856000, "exact_value_avg": 0.45117396116256714, "regret_dist": 0.35260340571403503, "regret_other_env": 0.5876383781433105, "regret_corner": 5.0921742513310164e-05, "regret_row": 0.3710100054740906, "regret_any": 0.5876383781433105, "regret_bot": 0.7615035176277161, "value_dist": 0.45117396116256714, "value_other_env": 0.24191471934318542, "value_corner": 0.7650628089904785, "value_row": 0.4256790578365326, "value_any": 0.24191471934318542, "value_bot": 0.03518550470471382, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01865.png", "entropy": 0.09570187330245972} +{"ts": "2026-01-29T22:02:37.138619Z", "loop": 1870, "env_steps": 1148928000, "exact_value_avg": 0.45117637515068054, "regret_dist": 0.352601021528244, "regret_other_env": 0.5876524448394775, "regret_corner": 2.382596539973747e-05, "regret_row": 0.37957918643951416, "regret_any": 0.5876524448394775, "regret_bot": 0.7598962783813477, "value_dist": 0.45117637515068054, "value_other_env": 0.24190066754817963, "value_corner": 0.7650899291038513, "value_row": 0.4171098470687866, "value_any": 0.24190066754817963, "value_bot": 0.03679275885224342, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01870.png", "entropy": 0.08428508043289185} +{"ts": "2026-01-29T22:02:42.982325Z", "loop": 1875, "env_steps": 1152000000, "exact_value_avg": 0.45142507553100586, "regret_dist": 0.3523522913455963, "regret_other_env": 0.5872344970703125, "regret_corner": 2.899269384215586e-05, "regret_row": 0.37695199251174927, "regret_any": 0.5872344970703125, "regret_bot": 0.760003387928009, "value_dist": 0.45142507553100586, "value_other_env": 0.24231858551502228, "value_corner": 0.7650847434997559, "value_row": 0.4197370409965515, "value_any": 0.24231858551502228, "value_bot": 0.03668569400906563, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01875.png", "entropy": 0.08662200719118118} +{"ts": "2026-01-29T22:02:48.824541Z", "loop": 1880, "env_steps": 1155072000, "exact_value_avg": 0.4515916109085083, "regret_dist": 0.35218578577041626, "regret_other_env": 0.586930513381958, "regret_corner": 6.868243508506566e-05, "regret_row": 0.3708994388580322, "regret_any": 0.586930513381958, "regret_bot": 0.7610129117965698, "value_dist": 0.4515916109085083, "value_other_env": 0.24262258410453796, "value_corner": 0.7650451064109802, "value_row": 0.42578959465026855, "value_any": 0.24262258410453796, "value_bot": 0.03567615523934364, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01880.png", "entropy": 0.09856147319078445} +{"ts": "2026-01-29T22:02:54.668743Z", "loop": 1885, "env_steps": 1158144000, "exact_value_avg": 0.45029905438423157, "regret_dist": 0.353478342294693, "regret_other_env": 0.5889390110969543, "regret_corner": 0.0002872889454010874, "regret_row": 0.36876171827316284, "regret_any": 0.5889390110969543, "regret_bot": 0.7620965838432312, "value_dist": 0.45029905438423157, "value_other_env": 0.24061410129070282, "value_corner": 0.7648264765739441, "value_row": 0.42792725563049316, "value_any": 0.24061410129070282, "value_bot": 0.03459245339035988, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01885.png", "entropy": 0.11526892334222794} +{"ts": "2026-01-29T22:03:00.516367Z", "loop": 1890, "env_steps": 1161216000, "exact_value_avg": 0.4507821202278137, "regret_dist": 0.3529953062534332, "regret_other_env": 0.5881891250610352, "regret_corner": 0.00020450950250960886, "regret_row": 0.369124174118042, "regret_any": 0.5881891250610352, "regret_bot": 0.7618010640144348, "value_dist": 0.4507821202278137, "value_other_env": 0.24136395752429962, "value_corner": 0.7649092674255371, "value_row": 0.4275648593902588, "value_any": 0.24136395752429962, "value_bot": 0.03488800674676895, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01890.png", "entropy": 0.11114213615655899} +{"ts": "2026-01-29T22:03:06.365967Z", "loop": 1895, "env_steps": 1164288000, "exact_value_avg": 0.45129162073135376, "regret_dist": 0.3524857759475708, "regret_other_env": 0.5873995423316956, "regret_corner": 0.00011510402691783383, "regret_row": 0.36940351128578186, "regret_any": 0.5873995423316956, "regret_bot": 0.7614945769309998, "value_dist": 0.45129162073135376, "value_other_env": 0.24215354025363922, "value_corner": 0.7649986743927002, "value_row": 0.4272855818271637, "value_any": 0.24215354025363922, "value_bot": 0.03519446402788162, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01895.png", "entropy": 0.10301302373409271} +{"ts": "2026-01-29T22:03:12.226465Z", "loop": 1900, "env_steps": 1167360000, "exact_value_avg": 0.45181503891944885, "regret_dist": 0.3519623577594757, "regret_other_env": 0.5865811109542847, "regret_corner": 3.4183762181783095e-05, "regret_row": 0.3713557720184326, "regret_any": 0.5865811109542847, "regret_bot": 0.7606327533721924, "value_dist": 0.45181503891944885, "value_other_env": 0.2429720163345337, "value_corner": 0.7650795578956604, "value_row": 0.42533326148986816, "value_any": 0.2429720163345337, "value_bot": 0.0360562764108181, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01900.png", "entropy": 0.08659788966178894} +{"ts": "2026-01-29T22:03:18.073487Z", "loop": 1905, "env_steps": 1170432000, "exact_value_avg": 0.4511953592300415, "regret_dist": 0.35258200764656067, "regret_other_env": 0.587620735168457, "regret_corner": 2.388854954915587e-05, "regret_row": 0.3817417323589325, "regret_any": 0.587620735168457, "regret_bot": 0.7594414949417114, "value_dist": 0.4511953592300415, "value_other_env": 0.24193237721920013, "value_corner": 0.7650898098945618, "value_row": 0.4149473011493683, "value_any": 0.24193237721920013, "value_bot": 0.037247560918331146, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01905.png", "entropy": 0.07950378954410553} +{"ts": "2026-01-29T22:03:23.918300Z", "loop": 1910, "env_steps": 1173504000, "exact_value_avg": 0.4506482481956482, "regret_dist": 0.353129118680954, "regret_other_env": 0.5884803533554077, "regret_corner": 0.00010222048149444163, "regret_row": 0.38821399211883545, "regret_any": 0.5884803533554077, "regret_bot": 0.7592301368713379, "value_dist": 0.4506482481956482, "value_other_env": 0.24107269942760468, "value_corner": 0.7650114893913269, "value_row": 0.40847504138946533, "value_any": 0.24107269942760468, "value_bot": 0.0374588817358017, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01910.png", "entropy": 0.08438766747713089} +{"ts": "2026-01-29T22:03:29.765615Z", "loop": 1915, "env_steps": 1176576000, "exact_value_avg": 0.4514300227165222, "regret_dist": 0.35234737396240234, "regret_other_env": 0.5871871709823608, "regret_corner": 8.764068479649723e-05, "regret_row": 0.3789955675601959, "regret_any": 0.5871871709823608, "regret_bot": 0.7598103880882263, "value_dist": 0.4514300227165222, "value_other_env": 0.24236591160297394, "value_corner": 0.7650260925292969, "value_row": 0.41769346594810486, "value_any": 0.24236591160297394, "value_bot": 0.03687865287065506, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01915.png", "entropy": 0.08986559510231018} +{"ts": "2026-01-29T22:03:35.617192Z", "loop": 1920, "env_steps": 1179648000, "exact_value_avg": 0.4481947422027588, "regret_dist": 0.3555826246738434, "regret_other_env": 0.5917124152183533, "regret_corner": 0.001387919532135129, "regret_row": 0.36639878153800964, "regret_any": 0.5917124152183533, "regret_bot": 0.7629139423370361, "value_dist": 0.4481947422027588, "value_other_env": 0.2378406822681427, "value_corner": 0.7637258172035217, "value_row": 0.4302903115749359, "value_any": 0.2378406822681427, "value_bot": 0.03377506881952286, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01920.png", "entropy": 0.1332658976316452} +{"ts": "2026-01-29T22:03:41.464987Z", "loop": 1925, "env_steps": 1182720000, "exact_value_avg": 0.44855618476867676, "regret_dist": 0.3552212119102478, "regret_other_env": 0.5914043188095093, "regret_corner": 0.0009465133771300316, "regret_row": 0.36636465787887573, "regret_any": 0.5914043188095093, "regret_bot": 0.7630282044410706, "value_dist": 0.44855618476867676, "value_other_env": 0.2381487935781479, "value_corner": 0.7641671895980835, "value_row": 0.43032437562942505, "value_any": 0.2381487935781479, "value_bot": 0.03366081789135933, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01925.png", "entropy": 0.1267540603876114} +{"ts": "2026-01-29T22:03:47.312276Z", "loop": 1930, "env_steps": 1185792000, "exact_value_avg": 0.4516429305076599, "regret_dist": 0.35213443636894226, "regret_other_env": 0.5868684649467468, "regret_corner": 3.339449904160574e-05, "regret_row": 0.36982080340385437, "regret_any": 0.5868684649467468, "regret_bot": 0.761234700679779, "value_dist": 0.4516429305076599, "value_other_env": 0.24268458783626556, "value_corner": 0.7650803923606873, "value_row": 0.4268682301044464, "value_any": 0.24268458783626556, "value_bot": 0.035454344004392624, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01930.png", "entropy": 0.08681140840053558} +{"ts": "2026-01-29T22:03:53.160279Z", "loop": 1935, "env_steps": 1188864000, "exact_value_avg": 0.45118045806884766, "regret_dist": 0.3525969386100769, "regret_other_env": 0.5876431465148926, "regret_corner": 2.7539830625755712e-05, "regret_row": 0.3697635531425476, "regret_any": 0.5876431465148926, "regret_bot": 0.7618839740753174, "value_dist": 0.45118045806884766, "value_other_env": 0.24190998077392578, "value_corner": 0.7650861740112305, "value_row": 0.4269254505634308, "value_any": 0.24190998077392578, "value_bot": 0.034805089235305786, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01935.png", "entropy": 0.08528953045606613} +{"ts": "2026-01-29T22:03:59.005537Z", "loop": 1940, "env_steps": 1191936000, "exact_value_avg": 0.45127058029174805, "regret_dist": 0.3525067865848541, "regret_other_env": 0.5874996185302734, "regret_corner": 1.7526250303490087e-05, "regret_row": 0.37165921926498413, "regret_any": 0.5874996185302734, "regret_bot": 0.7612243890762329, "value_dist": 0.45127058029174805, "value_other_env": 0.2420535385608673, "value_corner": 0.7650961875915527, "value_row": 0.42502981424331665, "value_any": 0.2420535385608673, "value_bot": 0.035464681684970856, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01940.png", "entropy": 0.07917220145463943} +{"ts": "2026-01-29T22:04:04.851931Z", "loop": 1945, "env_steps": 1195008000, "exact_value_avg": 0.4503425359725952, "regret_dist": 0.35343489050865173, "regret_other_env": 0.589052140712738, "regret_corner": 8.98192411113996e-06, "regret_row": 0.3891783654689789, "regret_any": 0.589052140712738, "regret_bot": 0.7589625120162964, "value_dist": 0.4503425359725952, "value_other_env": 0.24050097167491913, "value_corner": 0.7651047706604004, "value_row": 0.4075106382369995, "value_any": 0.24050097167491913, "value_bot": 0.037726495414972305, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01945.png", "entropy": 0.06976927816867828} +{"ts": "2026-01-29T22:04:10.698997Z", "loop": 1950, "env_steps": 1198080000, "exact_value_avg": 0.44966423511505127, "regret_dist": 0.3541131913661957, "regret_other_env": 0.590181291103363, "regret_corner": 1.0990103874064516e-05, "regret_row": 0.39676928520202637, "regret_any": 0.590181291103363, "regret_bot": 0.7587729692459106, "value_dist": 0.44966423511505127, "value_other_env": 0.2393718659877777, "value_corner": 0.765102744102478, "value_row": 0.3999198079109192, "value_any": 0.2393718659877777, "value_bot": 0.037916116416454315, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01950.png", "entropy": 0.06991793215274811} +{"ts": "2026-01-29T22:04:16.550435Z", "loop": 1955, "env_steps": 1201152000, "exact_value_avg": 0.4500555396080017, "regret_dist": 0.35372185707092285, "regret_other_env": 0.5895265340805054, "regret_corner": 1.4816721886745654e-05, "regret_row": 0.3945675790309906, "regret_any": 0.5895265340805054, "regret_bot": 0.7588222622871399, "value_dist": 0.4500555396080017, "value_other_env": 0.240026593208313, "value_corner": 0.7650989294052124, "value_row": 0.4021214544773102, "value_any": 0.240026593208313, "value_bot": 0.037866801023483276, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01955.png", "entropy": 0.07146626710891724} +{"ts": "2026-01-29T22:04:22.399791Z", "loop": 1960, "env_steps": 1204224000, "exact_value_avg": 0.4498031735420227, "regret_dist": 0.35397422313690186, "regret_other_env": 0.5899277925491333, "regret_corner": 4.381090548122302e-05, "regret_row": 0.3989378809928894, "regret_any": 0.5899277925491333, "regret_bot": 0.7588108777999878, "value_dist": 0.4498031735420227, "value_other_env": 0.23962534964084625, "value_corner": 0.7650699019432068, "value_row": 0.39775121212005615, "value_any": 0.23962534964084625, "value_bot": 0.037878233939409256, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01960.png", "entropy": 0.07570448517799377} +{"ts": "2026-01-29T22:04:28.246061Z", "loop": 1965, "env_steps": 1207296000, "exact_value_avg": 0.45111313462257385, "regret_dist": 0.35266420245170593, "regret_other_env": 0.5877541303634644, "regret_corner": 2.930561822722666e-05, "regret_row": 0.3845156729221344, "regret_any": 0.5877541303634644, "regret_bot": 0.7591810822486877, "value_dist": 0.45111313462257385, "value_other_env": 0.24179893732070923, "value_corner": 0.7650843858718872, "value_row": 0.4121733605861664, "value_any": 0.24179893732070923, "value_bot": 0.03750797361135483, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01965.png", "entropy": 0.07726074010133743} +{"ts": "2026-01-29T22:04:34.096966Z", "loop": 1970, "env_steps": 1210368000, "exact_value_avg": 0.451995849609375, "regret_dist": 0.35178154706954956, "regret_other_env": 0.5862813591957092, "regret_corner": 3.185023888363503e-05, "regret_row": 0.3742246925830841, "regret_any": 0.5862813591957092, "regret_bot": 0.7600158452987671, "value_dist": 0.451995849609375, "value_other_env": 0.24327179789543152, "value_corner": 0.7650818228721619, "value_row": 0.4224643409252167, "value_any": 0.24327179789543152, "value_bot": 0.036673229187726974, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01970.png", "entropy": 0.08331914246082306} +{"ts": "2026-01-29T22:04:39.950666Z", "loop": 1975, "env_steps": 1213440000, "exact_value_avg": 0.45072585344314575, "regret_dist": 0.3530515134334564, "regret_other_env": 0.588248074054718, "regret_corner": 0.0002566988405305892, "regret_row": 0.36759668588638306, "regret_any": 0.588248074054718, "regret_bot": 0.761773407459259, "value_dist": 0.45072585344314575, "value_other_env": 0.24130509793758392, "value_corner": 0.7648569941520691, "value_row": 0.4290924072265625, "value_any": 0.24130509793758392, "value_bot": 0.034915629774332047, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01975.png", "entropy": 0.11271712929010391} +{"ts": "2026-01-29T22:04:45.802550Z", "loop": 1980, "env_steps": 1216512000, "exact_value_avg": 0.4516823887825012, "regret_dist": 0.35209500789642334, "regret_other_env": 0.5867685675621033, "regret_corner": 8.46684051794e-05, "regret_row": 0.3690779209136963, "regret_any": 0.5867685675621033, "regret_bot": 0.7612863779067993, "value_dist": 0.4516823887825012, "value_other_env": 0.2427845299243927, "value_corner": 0.7650290727615356, "value_row": 0.4276111423969269, "value_any": 0.2427845299243927, "value_bot": 0.03540264815092087, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01980.png", "entropy": 0.09955379366874695} +{"ts": "2026-01-29T22:04:51.657455Z", "loop": 1985, "env_steps": 1219584000, "exact_value_avg": 0.4521237313747406, "regret_dist": 0.35165366530418396, "regret_other_env": 0.5860626101493835, "regret_corner": 4.0218732465291396e-05, "regret_row": 0.3706294000148773, "regret_any": 0.5860626101493835, "regret_bot": 0.7607411742210388, "value_dist": 0.4521237313747406, "value_other_env": 0.243490532040596, "value_corner": 0.7650734782218933, "value_row": 0.4260596036911011, "value_any": 0.243490532040596, "value_bot": 0.03594782575964928, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01985.png", "entropy": 0.08882205933332443} +{"ts": "2026-01-29T22:04:57.505878Z", "loop": 1990, "env_steps": 1222656000, "exact_value_avg": 0.4522092938423157, "regret_dist": 0.3515681028366089, "regret_other_env": 0.5859290361404419, "regret_corner": 2.6645760954124853e-05, "regret_row": 0.37147849798202515, "regret_any": 0.5859290361404419, "regret_bot": 0.7604162693023682, "value_dist": 0.4522092938423157, "value_other_env": 0.24362406134605408, "value_corner": 0.7650871276855469, "value_row": 0.425210565328598, "value_any": 0.24362406134605408, "value_bot": 0.036272794008255005, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01990.png", "entropy": 0.08176377415657043} +{"ts": "2026-01-29T22:05:03.353458Z", "loop": 1995, "env_steps": 1225728000, "exact_value_avg": 0.45178520679473877, "regret_dist": 0.3519921898841858, "regret_other_env": 0.5866346955299377, "regret_corner": 2.838919681380503e-05, "regret_row": 0.37742120027542114, "regret_any": 0.5866346955299377, "regret_bot": 0.7595810890197754, "value_dist": 0.45178520679473877, "value_other_env": 0.24291841685771942, "value_corner": 0.7650853395462036, "value_row": 0.41926780343055725, "value_any": 0.24291841685771942, "value_bot": 0.03710801154375076, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_01995.png", "entropy": 0.0763118714094162} +{"ts": "2026-01-29T22:05:09.200658Z", "loop": 2000, "env_steps": 1228800000, "exact_value_avg": 0.4509010314941406, "regret_dist": 0.35287636518478394, "regret_other_env": 0.58809494972229, "regret_corner": 4.8403941036667675e-05, "regret_row": 0.3885500133037567, "regret_any": 0.58809494972229, "regret_bot": 0.7590731978416443, "value_dist": 0.4509010314941406, "value_other_env": 0.24145814776420593, "value_corner": 0.7650653123855591, "value_row": 0.40813902020454407, "value_any": 0.24145814776420593, "value_bot": 0.03761586546897888, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02000.png", "entropy": 0.07491429895162582} +{"ts": "2026-01-29T22:05:20.848473Z", "loop": 2010, "env_steps": 1234944000, "exact_value_avg": 0.45227184891700745, "regret_dist": 0.3515055477619171, "regret_other_env": 0.5858294367790222, "regret_corner": 1.9678971511893906e-05, "regret_row": 0.37163934111595154, "regret_any": 0.5858294367790222, "regret_bot": 0.7603273391723633, "value_dist": 0.45227184891700745, "value_other_env": 0.24372367560863495, "value_corner": 0.7650940418243408, "value_row": 0.42504969239234924, "value_any": 0.24372367560863495, "value_bot": 0.0363616943359375, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02010.png", "entropy": 0.07729091495275497} +{"ts": "2026-01-29T22:05:32.509390Z", "loop": 2020, "env_steps": 1241088000, "exact_value_avg": 0.452303409576416, "regret_dist": 0.35147395730018616, "regret_other_env": 0.5857787132263184, "regret_corner": 1.679311208135914e-05, "regret_row": 0.371416300535202, "regret_any": 0.5857787132263184, "regret_bot": 0.7603644132614136, "value_dist": 0.452303409576416, "value_other_env": 0.24377435445785522, "value_corner": 0.7650969624519348, "value_row": 0.42527276277542114, "value_any": 0.24377435445785522, "value_bot": 0.03632465377449989, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02020.png", "entropy": 0.07582515478134155} +{"ts": "2026-01-29T22:05:44.168131Z", "loop": 2030, "env_steps": 1247232000, "exact_value_avg": 0.4523223638534546, "regret_dist": 0.35145509243011475, "regret_other_env": 0.585747480392456, "regret_corner": 1.644094845687505e-05, "regret_row": 0.37095627188682556, "regret_any": 0.585747480392456, "regret_bot": 0.7605619430541992, "value_dist": 0.4523223638534546, "value_other_env": 0.2438056915998459, "value_corner": 0.7650973200798035, "value_row": 0.4257327914237976, "value_any": 0.2438056915998459, "value_bot": 0.03612701967358589, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02030.png", "entropy": 0.0760805532336235} +{"ts": "2026-01-29T22:05:55.818450Z", "loop": 2040, "env_steps": 1253376000, "exact_value_avg": 0.4504367709159851, "regret_dist": 0.35334059596061707, "regret_other_env": 0.5888583064079285, "regret_corner": 6.402830331353471e-05, "regret_row": 0.3675142526626587, "regret_any": 0.5888583064079285, "regret_bot": 0.763433039188385, "value_dist": 0.4504367709159851, "value_other_env": 0.2406948208808899, "value_corner": 0.7650496363639832, "value_row": 0.4291747808456421, "value_any": 0.2406948208808899, "value_bot": 0.03325605392456055, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02040.png", "entropy": 0.09452319890260696} +{"ts": "2026-01-29T22:06:07.491284Z", "loop": 2050, "env_steps": 1259520000, "exact_value_avg": 0.45179784297943115, "regret_dist": 0.351979523897171, "regret_other_env": 0.5866287350654602, "regret_corner": 5.649030299537117e-06, "regret_row": 0.3727581799030304, "regret_any": 0.5866287350654602, "regret_bot": 0.7610204815864563, "value_dist": 0.45179784297943115, "value_other_env": 0.24292436242103577, "value_corner": 0.7651081085205078, "value_row": 0.4239308536052704, "value_any": 0.24292436242103577, "value_bot": 0.035668544471263885, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02050.png", "entropy": 0.0636540949344635} +{"ts": "2026-01-29T22:06:19.168100Z", "loop": 2060, "env_steps": 1265664000, "exact_value_avg": 0.45003247261047363, "regret_dist": 0.3537449240684509, "regret_other_env": 0.5895677804946899, "regret_corner": 1.0552505955274682e-05, "regret_row": 0.39309200644493103, "regret_any": 0.5895677804946899, "regret_bot": 0.7588282823562622, "value_dist": 0.45003247261047363, "value_other_env": 0.23998534679412842, "value_corner": 0.7651031613349915, "value_row": 0.40359699726104736, "value_any": 0.23998534679412842, "value_bot": 0.037860795855522156, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02060.png", "entropy": 0.05877930298447609} +{"ts": "2026-01-29T22:06:30.843897Z", "loop": 2070, "env_steps": 1271808000, "exact_value_avg": 0.4518178701400757, "regret_dist": 0.3519595265388489, "regret_other_env": 0.5865881443023682, "regret_corner": 1.655171399761457e-05, "regret_row": 0.3759700655937195, "regret_any": 0.5865881443023682, "regret_bot": 0.7599586248397827, "value_dist": 0.4518178701400757, "value_other_env": 0.2429649531841278, "value_corner": 0.7650972008705139, "value_row": 0.4207189381122589, "value_any": 0.2429649531841278, "value_bot": 0.03673044592142105, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02070.png", "entropy": 0.06110777705907822} +{"ts": "2026-01-29T22:06:42.503092Z", "loop": 2080, "env_steps": 1277952000, "exact_value_avg": 0.4509970545768738, "regret_dist": 0.3527803122997284, "regret_other_env": 0.5879148840904236, "regret_corner": 7.842779450584203e-05, "regret_row": 0.3670576512813568, "regret_any": 0.5879148840904236, "regret_bot": 0.762482762336731, "value_dist": 0.4509970545768738, "value_other_env": 0.24163822829723358, "value_corner": 0.7650352716445923, "value_row": 0.42963141202926636, "value_any": 0.24163822829723358, "value_bot": 0.03420625999569893, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02080.png", "entropy": 0.08635164797306061} +{"ts": "2026-01-29T22:06:54.177024Z", "loop": 2090, "env_steps": 1284096000, "exact_value_avg": 0.45234084129333496, "regret_dist": 0.35143646597862244, "regret_other_env": 0.5857232809066772, "regret_corner": 6.205837053130381e-06, "regret_row": 0.36932605504989624, "regret_any": 0.5857232809066772, "regret_bot": 0.7610957026481628, "value_dist": 0.45234084129333496, "value_other_env": 0.24382974207401276, "value_corner": 0.7651075124740601, "value_row": 0.42736297845840454, "value_any": 0.24382974207401276, "value_bot": 0.03559333458542824, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02090.png", "entropy": 0.06213776022195816} +{"ts": "2026-01-29T22:07:05.842481Z", "loop": 2100, "env_steps": 1290240000, "exact_value_avg": 0.4493659734725952, "regret_dist": 0.35441136360168457, "regret_other_env": 0.5906383991241455, "regret_corner": 7.078449561959133e-05, "regret_row": 0.3991229236125946, "regret_any": 0.5906383991241455, "regret_bot": 0.7586687803268433, "value_dist": 0.4493659734725952, "value_other_env": 0.23891468346118927, "value_corner": 0.7650429010391235, "value_row": 0.39756616950035095, "value_any": 0.23891468346118927, "value_bot": 0.03802027553319931, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02100.png", "entropy": 0.0613136924803257} +{"ts": "2026-01-29T22:07:17.504420Z", "loop": 2110, "env_steps": 1296384000, "exact_value_avg": 0.45103079080581665, "regret_dist": 0.35274654626846313, "regret_other_env": 0.5879021883010864, "regret_corner": 1.3034046787652187e-05, "regret_row": 0.3857409358024597, "regret_any": 0.5879021883010864, "regret_bot": 0.759073793888092, "value_dist": 0.45103079080581665, "value_other_env": 0.24165084958076477, "value_corner": 0.7651007175445557, "value_row": 0.41094812750816345, "value_any": 0.24165084958076477, "value_bot": 0.03761531785130501, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02110.png", "entropy": 0.05934711918234825} +{"ts": "2026-01-29T22:07:29.169488Z", "loop": 2120, "env_steps": 1302528000, "exact_value_avg": 0.4475638270378113, "regret_dist": 0.3562135398387909, "regret_other_env": 0.593672513961792, "regret_corner": 2.5053323042811826e-05, "regret_row": 0.36768636107444763, "regret_any": 0.593672513961792, "regret_bot": 0.7650391459465027, "value_dist": 0.4475638270378113, "value_other_env": 0.23588056862354279, "value_corner": 0.765088677406311, "value_row": 0.42900270223617554, "value_any": 0.23588056862354279, "value_bot": 0.031649913638830185, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02120.png", "entropy": 0.08547448366880417} +{"ts": "2026-01-29T22:07:40.832731Z", "loop": 2130, "env_steps": 1308672000, "exact_value_avg": 0.45213109254837036, "regret_dist": 0.3516462743282318, "regret_other_env": 0.5860733985900879, "regret_corner": 5.569557743001496e-06, "regret_row": 0.3717350363731384, "regret_any": 0.5860733985900879, "regret_bot": 0.7606098651885986, "value_dist": 0.45213109254837036, "value_other_env": 0.2434796839952469, "value_corner": 0.7651081681251526, "value_row": 0.42495402693748474, "value_any": 0.2434796839952469, "value_bot": 0.036079198122024536, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02130.png", "entropy": 0.05716186389327049} +{"ts": "2026-01-29T22:07:52.490209Z", "loop": 2140, "env_steps": 1314816000, "exact_value_avg": 0.4523271918296814, "regret_dist": 0.35145023465156555, "regret_other_env": 0.5857459902763367, "regret_corner": 6.588300493604038e-06, "regret_row": 0.3687497675418854, "regret_any": 0.5857459902763367, "regret_bot": 0.7617040276527405, "value_dist": 0.4523271918296814, "value_other_env": 0.24380718171596527, "value_corner": 0.7651071548461914, "value_row": 0.4279393255710602, "value_any": 0.24380718171596527, "value_bot": 0.0349850207567215, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02140.png", "entropy": 0.062071267515420914} +{"ts": "2026-01-29T22:08:04.162977Z", "loop": 2150, "env_steps": 1320960000, "exact_value_avg": 0.4523463249206543, "regret_dist": 0.3514310419559479, "regret_other_env": 0.5857143402099609, "regret_corner": 6.015102371748071e-06, "regret_row": 0.3703094720840454, "regret_any": 0.5857143402099609, "regret_bot": 0.7605718970298767, "value_dist": 0.4523463249206543, "value_other_env": 0.24383869767189026, "value_corner": 0.7651076912879944, "value_row": 0.42637956142425537, "value_any": 0.24383869767189026, "value_bot": 0.03611713647842407, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02150.png", "entropy": 0.05667663738131523} +{"ts": "2026-01-29T22:08:15.809744Z", "loop": 2160, "env_steps": 1327104000, "exact_value_avg": 0.45226871967315674, "regret_dist": 0.3515087068080902, "regret_other_env": 0.5858444571495056, "regret_corner": 5.059441264165798e-06, "regret_row": 0.37015798687934875, "regret_any": 0.5858444571495056, "regret_bot": 0.7609394192695618, "value_dist": 0.45226871967315674, "value_other_env": 0.24370871484279633, "value_corner": 0.7651086449623108, "value_row": 0.426531046628952, "value_any": 0.24370871484279633, "value_bot": 0.03574962913990021, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02160.png", "entropy": 0.05626780912280083} +{"ts": "2026-01-29T22:08:27.458698Z", "loop": 2170, "env_steps": 1333248000, "exact_value_avg": 0.4519994854927063, "regret_dist": 0.3517778515815735, "regret_other_env": 0.5862916111946106, "regret_corner": 7.178883151937043e-06, "regret_row": 0.36859503388404846, "regret_any": 0.5862916111946106, "regret_bot": 0.7621281743049622, "value_dist": 0.4519994854927063, "value_other_env": 0.2432614266872406, "value_corner": 0.7651065587997437, "value_row": 0.4280939996242523, "value_any": 0.2432614266872406, "value_bot": 0.03456084802746773, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02170.png", "entropy": 0.06386282294988632} +{"ts": "2026-01-29T22:08:39.143274Z", "loop": 2180, "env_steps": 1339392000, "exact_value_avg": 0.45149028301239014, "regret_dist": 0.35228705406188965, "regret_other_env": 0.5871381759643555, "regret_corner": 1.03597849374637e-05, "regret_row": 0.3682759404182434, "regret_any": 0.5871381759643555, "regret_bot": 0.7623496055603027, "value_dist": 0.45149028301239014, "value_other_env": 0.24241486191749573, "value_corner": 0.7651033997535706, "value_row": 0.428413063287735, "value_any": 0.24241486191749573, "value_bot": 0.03433940187096596, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02180.png", "entropy": 0.06898217648267746} +{"ts": "2026-01-29T22:08:50.831533Z", "loop": 2190, "env_steps": 1345536000, "exact_value_avg": 0.4523783326148987, "regret_dist": 0.35139909386634827, "regret_other_env": 0.5856568217277527, "regret_corner": 1.2467802662285976e-05, "regret_row": 0.37047114968299866, "regret_any": 0.5856568217277527, "regret_bot": 0.7601549029350281, "value_dist": 0.4523783326148987, "value_other_env": 0.24389636516571045, "value_corner": 0.7651012539863586, "value_row": 0.4262179136276245, "value_any": 0.24389636516571045, "value_bot": 0.03653407841920853, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02190.png", "entropy": 0.05489656701683998} +{"ts": "2026-01-29T22:09:02.497014Z", "loop": 2200, "env_steps": 1351680000, "exact_value_avg": 0.45018255710601807, "regret_dist": 0.3535948097705841, "regret_other_env": 0.5888230800628662, "regret_corner": 0.0007523546810261905, "regret_row": 0.3903900980949402, "regret_any": 0.5888230800628662, "regret_bot": 0.7589974403381348, "value_dist": 0.45018255710601807, "value_other_env": 0.24072997272014618, "value_corner": 0.7643614411354065, "value_row": 0.406298965215683, "value_any": 0.24072997272014618, "value_bot": 0.03769160807132721, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02200.png", "entropy": 0.06473555415868759} +{"ts": "2026-01-29T22:09:14.165581Z", "loop": 2210, "env_steps": 1357824000, "exact_value_avg": 0.4520743489265442, "regret_dist": 0.351703017950058, "regret_other_env": 0.5861164331436157, "regret_corner": 8.281916962005198e-05, "regret_row": 0.3753836452960968, "regret_any": 0.5861164331436157, "regret_bot": 0.7597427368164062, "value_dist": 0.4520743489265442, "value_other_env": 0.24343660473823547, "value_corner": 0.7650309801101685, "value_row": 0.42130541801452637, "value_any": 0.24343660473823547, "value_bot": 0.03694629296660423, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02210.png", "entropy": 0.06451839208602905} +{"ts": "2026-01-29T22:09:25.829475Z", "loop": 2220, "env_steps": 1363968000, "exact_value_avg": 0.4510740339756012, "regret_dist": 0.352703332901001, "regret_other_env": 0.5878015756607056, "regret_corner": 5.593200694420375e-05, "regret_row": 0.3643122911453247, "regret_any": 0.5878015756607056, "regret_bot": 0.7627375721931458, "value_dist": 0.4510740339756012, "value_other_env": 0.2417515218257904, "value_corner": 0.7650578022003174, "value_row": 0.43237677216529846, "value_any": 0.2417515218257904, "value_bot": 0.03395146504044533, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02220.png", "entropy": 0.08233971893787384} +{"ts": "2026-01-29T22:09:37.491939Z", "loop": 2230, "env_steps": 1370112000, "exact_value_avg": 0.4522269368171692, "regret_dist": 0.351550430059433, "regret_other_env": 0.585905909538269, "regret_corner": 1.718004568829201e-05, "regret_row": 0.3664630055427551, "regret_any": 0.585905909538269, "regret_bot": 0.7620159983634949, "value_dist": 0.4522269368171692, "value_other_env": 0.24364715814590454, "value_corner": 0.7650966048240662, "value_row": 0.43022602796554565, "value_any": 0.24364715814590454, "value_bot": 0.034673064947128296, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02230.png", "entropy": 0.07089965790510178} +{"ts": "2026-01-29T22:09:49.160322Z", "loop": 2240, "env_steps": 1376256000, "exact_value_avg": 0.4525221586227417, "regret_dist": 0.3512552082538605, "regret_other_env": 0.585419237613678, "regret_corner": 9.158750799542759e-06, "regret_row": 0.3701658248901367, "regret_any": 0.585419237613678, "regret_bot": 0.7603428363800049, "value_dist": 0.4525221586227417, "value_other_env": 0.2441338449716568, "value_corner": 0.7651045918464661, "value_row": 0.42652323842048645, "value_any": 0.2441338449716568, "value_bot": 0.0363461934030056, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02240.png", "entropy": 0.055775102227926254} +{"ts": "2026-01-29T22:10:00.828356Z", "loop": 2250, "env_steps": 1382400000, "exact_value_avg": 0.45200690627098083, "regret_dist": 0.35177043080329895, "regret_other_env": 0.5862753987312317, "regret_corner": 1.2953580153407529e-05, "regret_row": 0.3672477900981903, "regret_any": 0.5862753987312317, "regret_bot": 0.7624149918556213, "value_dist": 0.45200690627098083, "value_other_env": 0.2432776391506195, "value_corner": 0.7651007771492004, "value_row": 0.42944127321243286, "value_any": 0.2432776391506195, "value_bot": 0.03427405655384064, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02250.png", "entropy": 0.06735033541917801} +{"ts": "2026-01-29T22:10:12.472397Z", "loop": 2260, "env_steps": 1388544000, "exact_value_avg": 0.4525482952594757, "regret_dist": 0.35122910141944885, "regret_other_env": 0.5853766202926636, "regret_corner": 7.801255378581118e-06, "regret_row": 0.36905092000961304, "regret_any": 0.5853766202926636, "regret_bot": 0.761247992515564, "value_dist": 0.4525482952594757, "value_other_env": 0.24417652189731598, "value_corner": 0.7651059031486511, "value_row": 0.42763808369636536, "value_any": 0.24417652189731598, "value_bot": 0.0354410745203495, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02260.png", "entropy": 0.054417457431554794} +{"ts": "2026-01-29T22:10:24.119544Z", "loop": 2270, "env_steps": 1394688000, "exact_value_avg": 0.4504339098930359, "regret_dist": 0.3533434569835663, "regret_other_env": 0.5888667106628418, "regret_corner": 5.8556601288728416e-05, "regret_row": 0.392936646938324, "regret_any": 0.5888667106628418, "regret_bot": 0.7588886618614197, "value_dist": 0.4504339098930359, "value_other_env": 0.24068638682365417, "value_corner": 0.7650551795959473, "value_row": 0.4037524461746216, "value_any": 0.24068638682365417, "value_bot": 0.037800442427396774, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02270.png", "entropy": 0.0594184547662735} +{"ts": "2026-01-29T22:10:35.786359Z", "loop": 2280, "env_steps": 1400832000, "exact_value_avg": 0.4520123600959778, "regret_dist": 0.35176509618759155, "regret_other_env": 0.5862483978271484, "regret_corner": 4.005829759989865e-05, "regret_row": 0.3758501410484314, "regret_any": 0.5862483978271484, "regret_bot": 0.7596726417541504, "value_dist": 0.4520123600959778, "value_other_env": 0.24330474436283112, "value_corner": 0.7650737166404724, "value_row": 0.420838862657547, "value_any": 0.24330474436283112, "value_bot": 0.03701641038060188, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02280.png", "entropy": 0.05984936282038689} +{"ts": "2026-01-29T22:10:47.452030Z", "loop": 2290, "env_steps": 1406976000, "exact_value_avg": 0.45267242193222046, "regret_dist": 0.3511050045490265, "regret_other_env": 0.5851655602455139, "regret_corner": 1.4142196050670464e-05, "regret_row": 0.36815160512924194, "regret_any": 0.5851655602455139, "regret_bot": 0.7611157894134521, "value_dist": 0.45267242193222046, "value_other_env": 0.24438756704330444, "value_corner": 0.7650996446609497, "value_row": 0.42853742837905884, "value_any": 0.24438756704330444, "value_bot": 0.035573240369558334, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02290.png", "entropy": 0.06081831827759743} +{"ts": "2026-01-29T22:10:59.103754Z", "loop": 2300, "env_steps": 1413120000, "exact_value_avg": 0.44917333126068115, "regret_dist": 0.3546040654182434, "regret_other_env": 0.5908967852592468, "regret_corner": 0.0001649459300097078, "regret_row": 0.36263206601142883, "regret_any": 0.5908967852592468, "regret_bot": 0.7641644477844238, "value_dist": 0.44917333126068115, "value_other_env": 0.23865629732608795, "value_corner": 0.764948844909668, "value_row": 0.43405699729919434, "value_any": 0.23865629732608795, "value_bot": 0.03252461180090904, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02300.png", "entropy": 0.08979210257530212} +{"ts": "2026-01-29T22:11:10.781792Z", "loop": 2310, "env_steps": 1419264000, "exact_value_avg": 0.4513077437877655, "regret_dist": 0.35246962308883667, "regret_other_env": 0.5874413847923279, "regret_corner": 1.1928877029276919e-05, "regret_row": 0.36753395199775696, "regret_any": 0.5874413847923279, "regret_bot": 0.7627697587013245, "value_dist": 0.4513077437877655, "value_other_env": 0.2421116828918457, "value_corner": 0.7651017904281616, "value_row": 0.4291550815105438, "value_any": 0.2421116828918457, "value_bot": 0.0339193120598793, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02310.png", "entropy": 0.06472214311361313} +{"ts": "2026-01-29T22:11:22.457330Z", "loop": 2320, "env_steps": 1425408000, "exact_value_avg": 0.45166289806365967, "regret_dist": 0.3521144986152649, "regret_other_env": 0.5868540406227112, "regret_corner": 5.116065494803479e-06, "regret_row": 0.37642890214920044, "regret_any": 0.5868540406227112, "regret_bot": 0.7611696720123291, "value_dist": 0.45166289806365967, "value_other_env": 0.24269910156726837, "value_corner": 0.765108585357666, "value_row": 0.42026013135910034, "value_any": 0.24269910156726837, "value_bot": 0.03551936149597168, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02320.png", "entropy": 0.04860778525471687} +{"ts": "2026-01-29T22:11:34.127766Z", "loop": 2330, "env_steps": 1431552000, "exact_value_avg": 0.4510684609413147, "regret_dist": 0.3527089059352875, "regret_other_env": 0.587844729423523, "regret_corner": 5.141894234839128e-06, "regret_row": 0.38492366671562195, "regret_any": 0.587844729423523, "regret_bot": 0.7595390677452087, "value_dist": 0.4510684609413147, "value_other_env": 0.24170835316181183, "value_corner": 0.765108585357666, "value_row": 0.41176533699035645, "value_any": 0.24170835316181183, "value_bot": 0.03715001791715622, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02330.png", "entropy": 0.04798939824104309} +{"ts": "2026-01-29T22:11:45.779099Z", "loop": 2340, "env_steps": 1437696000, "exact_value_avg": 0.451479434967041, "regret_dist": 0.35229796171188354, "regret_other_env": 0.587157666683197, "regret_corner": 8.344650268554688e-06, "regret_row": 0.38100099563598633, "regret_any": 0.587157666683197, "regret_bot": 0.7592058181762695, "value_dist": 0.451479434967041, "value_other_env": 0.24239543080329895, "value_corner": 0.7651053667068481, "value_row": 0.41568809747695923, "value_any": 0.24239543080329895, "value_bot": 0.03748326748609543, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02340.png", "entropy": 0.05004710704088211} +{"ts": "2026-01-29T22:11:57.435581Z", "loop": 2350, "env_steps": 1443840000, "exact_value_avg": 0.4525148272514343, "regret_dist": 0.35126256942749023, "regret_other_env": 0.5854318141937256, "regret_corner": 8.626779163023457e-06, "regret_row": 0.36817774176597595, "regret_any": 0.5854318141937256, "regret_bot": 0.7618573307991028, "value_dist": 0.4525148272514343, "value_other_env": 0.2441212683916092, "value_corner": 0.7651050686836243, "value_row": 0.4285113215446472, "value_any": 0.2441212683916092, "value_bot": 0.034831658005714417, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02350.png", "entropy": 0.055635716766119} +{"ts": "2026-01-29T22:12:09.099004Z", "loop": 2360, "env_steps": 1449984000, "exact_value_avg": 0.4516719877719879, "regret_dist": 0.35210537910461426, "regret_other_env": 0.5868263840675354, "regret_corner": 2.3855269319028594e-05, "regret_row": 0.36337810754776, "regret_any": 0.5868263840675354, "regret_bot": 0.7629308104515076, "value_dist": 0.4516719877719879, "value_other_env": 0.24272674322128296, "value_corner": 0.7650898098945618, "value_row": 0.43331092596054077, "value_any": 0.24272674322128296, "value_bot": 0.0337582528591156, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02360.png", "entropy": 0.07335931807756424} +{"ts": "2026-01-29T22:12:20.755506Z", "loop": 2370, "env_steps": 1456128000, "exact_value_avg": 0.45262593030929565, "regret_dist": 0.3511514365673065, "regret_other_env": 0.5852413773536682, "regret_corner": 1.6456346202176064e-05, "regret_row": 0.37022846937179565, "regret_any": 0.5852413773536682, "regret_bot": 0.7599762678146362, "value_dist": 0.45262593030929565, "value_other_env": 0.24431176483631134, "value_corner": 0.7650972008705139, "value_row": 0.4264605641365051, "value_any": 0.24431176483631134, "value_bot": 0.03671273961663246, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02370.png", "entropy": 0.054465778172016144} +{"ts": "2026-01-29T22:12:32.419879Z", "loop": 2380, "env_steps": 1462272000, "exact_value_avg": 0.4486158490180969, "regret_dist": 0.35516151785850525, "regret_other_env": 0.5904962420463562, "regret_corner": 0.0021594271529465914, "regret_row": 0.41737231612205505, "regret_any": 0.5904962420463562, "regret_bot": 0.7590625882148743, "value_dist": 0.4486158490180969, "value_other_env": 0.23905688524246216, "value_corner": 0.7629542946815491, "value_row": 0.3793167471885681, "value_any": 0.23905688524246216, "value_bot": 0.03762645274400711, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02380.png", "entropy": 0.06807054579257965} +{"ts": "2026-01-29T22:12:44.061443Z", "loop": 2390, "env_steps": 1468416000, "exact_value_avg": 0.45264554023742676, "regret_dist": 0.351131796836853, "regret_other_env": 0.5851972699165344, "regret_corner": 3.3554435503901914e-05, "regret_row": 0.36692389845848083, "regret_any": 0.5851972699165344, "regret_bot": 0.7608327865600586, "value_dist": 0.45264554023742676, "value_other_env": 0.24435578286647797, "value_corner": 0.7650801539421082, "value_row": 0.42976513504981995, "value_any": 0.24435578286647797, "value_bot": 0.0358562208712101, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02390.png", "entropy": 0.070034459233284} +{"ts": "2026-01-29T22:12:55.705025Z", "loop": 2400, "env_steps": 1474560000, "exact_value_avg": 0.45170289278030396, "regret_dist": 0.3520744740962982, "regret_other_env": 0.5867530107498169, "regret_corner": 5.659212911268696e-05, "regret_row": 0.3641048073768616, "regret_any": 0.5867530107498169, "regret_bot": 0.7626000642776489, "value_dist": 0.45170289278030396, "value_other_env": 0.24280008673667908, "value_corner": 0.7650571465492249, "value_row": 0.4325842559337616, "value_any": 0.24280008673667908, "value_bot": 0.03408903628587723, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02400.png", "entropy": 0.08137276768684387} +{"ts": "2026-01-29T22:13:07.362431Z", "loop": 2410, "env_steps": 1480704000, "exact_value_avg": 0.451779842376709, "regret_dist": 0.3519975543022156, "regret_other_env": 0.5866313576698303, "regret_corner": 4.6800574637018144e-05, "regret_row": 0.38207781314849854, "regret_any": 0.5866313576698303, "regret_bot": 0.759668231010437, "value_dist": 0.451779842376709, "value_other_env": 0.24292178452014923, "value_corner": 0.765066921710968, "value_row": 0.41461125016212463, "value_any": 0.24292178452014923, "value_bot": 0.037020836025476456, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02410.png", "entropy": 0.06601231545209885} +{"ts": "2026-01-29T22:13:19.018845Z", "loop": 2420, "env_steps": 1486848000, "exact_value_avg": 0.4492051899433136, "regret_dist": 0.35457220673561096, "regret_other_env": 0.5908716320991516, "regret_corner": 0.00012301704555284232, "regret_row": 0.4263506233692169, "regret_any": 0.5908716320991516, "regret_bot": 0.7593047022819519, "value_dist": 0.4492051899433136, "value_other_env": 0.23868142068386078, "value_corner": 0.7649908065795898, "value_row": 0.37033843994140625, "value_any": 0.23868142068386078, "value_bot": 0.03738431632518768, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02420.png", "entropy": 0.06995246559381485} +{"ts": "2026-01-29T22:13:30.677365Z", "loop": 2430, "env_steps": 1492992000, "exact_value_avg": 0.4512805938720703, "regret_dist": 0.35249677300453186, "regret_other_env": 0.5874336361885071, "regret_corner": 9.140471956925467e-05, "regret_row": 0.3934086859226227, "regret_any": 0.5874336361885071, "regret_bot": 0.7599458694458008, "value_dist": 0.4512805938720703, "value_other_env": 0.2421194463968277, "value_corner": 0.765022337436676, "value_row": 0.4032803475856781, "value_any": 0.2421194463968277, "value_bot": 0.03674313798546791, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02430.png", "entropy": 0.07312694936990738} +{"ts": "2026-01-29T22:13:42.329378Z", "loop": 2440, "env_steps": 1499136000, "exact_value_avg": 0.45206236839294434, "regret_dist": 0.3517150282859802, "regret_other_env": 0.586132287979126, "regret_corner": 8.913130295695737e-05, "regret_row": 0.3777390718460083, "regret_any": 0.586132287979126, "regret_bot": 0.7607471346855164, "value_dist": 0.45206236839294434, "value_other_env": 0.24342080950737, "value_corner": 0.7650246024131775, "value_row": 0.4189499318599701, "value_any": 0.24342080950737, "value_bot": 0.03594197705388069, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02440.png", "entropy": 0.08372566848993301} +{"ts": "2026-01-29T22:13:53.977665Z", "loop": 2450, "env_steps": 1505280000, "exact_value_avg": 0.45144954323768616, "regret_dist": 0.3523278534412384, "regret_other_env": 0.5870854258537292, "regret_corner": 0.00019151171727571636, "regret_row": 0.38341230154037476, "regret_any": 0.5870854258537292, "regret_bot": 0.761039137840271, "value_dist": 0.45144954323768616, "value_other_env": 0.2424677014350891, "value_corner": 0.7649222612380981, "value_row": 0.4132767915725708, "value_any": 0.2424677014350891, "value_bot": 0.035649970173835754, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02450.png", "entropy": 0.09304271638393402} +{"ts": "2026-01-29T22:14:05.629029Z", "loop": 2460, "env_steps": 1511424000, "exact_value_avg": 0.45004963874816895, "regret_dist": 0.353727787733078, "regret_other_env": 0.589187502861023, "regret_corner": 0.0005381475202739239, "regret_row": 0.39302486181259155, "regret_any": 0.589187502861023, "regret_bot": 0.7614577412605286, "value_dist": 0.45004963874816895, "value_other_env": 0.2403656393289566, "value_corner": 0.7645756006240845, "value_row": 0.40366417169570923, "value_any": 0.2403656393289566, "value_bot": 0.03523128107190132, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02460.png", "entropy": 0.10607234388589859} +{"ts": "2026-01-29T22:14:17.290743Z", "loop": 2470, "env_steps": 1517568000, "exact_value_avg": 0.4522464871406555, "regret_dist": 0.35153084993362427, "regret_other_env": 0.5858166813850403, "regret_corner": 0.00010205806029262021, "regret_row": 0.37571683526039124, "regret_any": 0.5858166813850403, "regret_bot": 0.760604977607727, "value_dist": 0.4522464871406555, "value_other_env": 0.2437364161014557, "value_corner": 0.7650116086006165, "value_row": 0.42097222805023193, "value_any": 0.2437364161014557, "value_bot": 0.03608408197760582, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02470.png", "entropy": 0.07631883025169373} +{"ts": "2026-01-29T22:14:28.943221Z", "loop": 2480, "env_steps": 1523712000, "exact_value_avg": 0.4527701139450073, "regret_dist": 0.35100722312927246, "regret_other_env": 0.5849937796592712, "regret_corner": 2.7379892344470136e-05, "regret_row": 0.3639058768749237, "regret_any": 0.5849937796592712, "regret_bot": 0.7614246606826782, "value_dist": 0.4527701139450073, "value_other_env": 0.24455927312374115, "value_corner": 0.7650864124298096, "value_row": 0.43278321623802185, "value_any": 0.24455927312374115, "value_bot": 0.03526438772678375, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02480.png", "entropy": 0.06712181866168976} +{"ts": "2026-01-29T22:14:40.598189Z", "loop": 2490, "env_steps": 1529856000, "exact_value_avg": 0.45257067680358887, "regret_dist": 0.3512066900730133, "regret_other_env": 0.5853292942047119, "regret_corner": 2.268701973662246e-05, "regret_row": 0.36450132727622986, "regret_any": 0.5853292942047119, "regret_bot": 0.7618619799613953, "value_dist": 0.45257067680358887, "value_other_env": 0.24422374367713928, "value_corner": 0.7650911211967468, "value_row": 0.4321877062320709, "value_any": 0.24422374367713928, "value_bot": 0.03482705354690552, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02490.png", "entropy": 0.0629562959074974} +{"ts": "2026-01-29T22:14:52.250656Z", "loop": 2500, "env_steps": 1536000000, "exact_value_avg": 0.45180952548980713, "regret_dist": 0.35196778178215027, "regret_other_env": 0.5866018533706665, "regret_corner": 1.6638638044241816e-05, "regret_row": 0.3645973205566406, "regret_any": 0.5866018533706665, "regret_bot": 0.7630128264427185, "value_dist": 0.45180952548980713, "value_other_env": 0.2429511696100235, "value_corner": 0.7650970816612244, "value_row": 0.43209171295166016, "value_any": 0.2429511696100235, "value_bot": 0.03367620334029198, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02500.png", "entropy": 0.06277137249708176} +{"ts": "2026-01-29T22:15:03.906672Z", "loop": 2510, "env_steps": 1542144000, "exact_value_avg": 0.45268964767456055, "regret_dist": 0.351087749004364, "regret_other_env": 0.5851408839225769, "regret_corner": 8.071959200606216e-06, "regret_row": 0.3687416613101959, "regret_any": 0.5851408839225769, "regret_bot": 0.7609869241714478, "value_dist": 0.45268964767456055, "value_other_env": 0.24441224336624146, "value_corner": 0.765105664730072, "value_row": 0.42794734239578247, "value_any": 0.24441224336624146, "value_bot": 0.03570210933685303, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02510.png", "entropy": 0.04785897955298424} +{"ts": "2026-01-29T22:15:15.579145Z", "loop": 2520, "env_steps": 1548288000, "exact_value_avg": 0.44902318716049194, "regret_dist": 0.35475417971611023, "regret_other_env": 0.591224730014801, "regret_corner": 4.838804670725949e-05, "regret_row": 0.4073658287525177, "regret_any": 0.591224730014801, "regret_bot": 0.7586109638214111, "value_dist": 0.44902318716049194, "value_other_env": 0.23832836747169495, "value_corner": 0.7650653719902039, "value_row": 0.38932323455810547, "value_any": 0.23832836747169495, "value_bot": 0.03807809203863144, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02520.png", "entropy": 0.05497034266591072} +{"ts": "2026-01-29T22:15:27.231057Z", "loop": 2530, "env_steps": 1554432000, "exact_value_avg": 0.45245450735092163, "regret_dist": 0.35132285952568054, "regret_other_env": 0.5855327844619751, "regret_corner": 7.986029231688008e-06, "regret_row": 0.37175536155700684, "regret_any": 0.5855327844619751, "regret_bot": 0.7595770359039307, "value_dist": 0.45245450735092163, "value_other_env": 0.24402037262916565, "value_corner": 0.7651057243347168, "value_row": 0.4249337613582611, "value_any": 0.24402037262916565, "value_bot": 0.03711198642849922, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02530.png", "entropy": 0.04908750206232071} +{"ts": "2026-01-29T22:15:38.891534Z", "loop": 2540, "env_steps": 1560576000, "exact_value_avg": 0.45278239250183105, "regret_dist": 0.35099491477012634, "regret_other_env": 0.5849835276603699, "regret_corner": 1.2011826584057417e-05, "regret_row": 0.3652534484863281, "regret_any": 0.5849835276603699, "regret_bot": 0.7617300152778625, "value_dist": 0.45278239250183105, "value_other_env": 0.24456949532032013, "value_corner": 0.7651017308235168, "value_row": 0.43143558502197266, "value_any": 0.24456949532032013, "value_bot": 0.03495904430747032, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02540.png", "entropy": 0.05353761091828346} +{"ts": "2026-01-29T22:15:50.555278Z", "loop": 2550, "env_steps": 1566720000, "exact_value_avg": 0.452514111995697, "regret_dist": 0.35126325488090515, "regret_other_env": 0.5854247808456421, "regret_corner": 2.0954013962182216e-05, "regret_row": 0.36301565170288086, "regret_any": 0.5854247808456421, "regret_bot": 0.7625432014465332, "value_dist": 0.452514111995697, "value_other_env": 0.2441282868385315, "value_corner": 0.7650927901268005, "value_row": 0.4336734116077423, "value_any": 0.2441282868385315, "value_bot": 0.03414582088589668, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02550.png", "entropy": 0.06236930936574936} +{"ts": "2026-01-29T22:16:02.215619Z", "loop": 2560, "env_steps": 1572864000, "exact_value_avg": 0.45062822103500366, "regret_dist": 0.3531491458415985, "regret_other_env": 0.5884244441986084, "regret_corner": 0.00023621968284714967, "regret_row": 0.36211591958999634, "regret_any": 0.5884244441986084, "regret_bot": 0.7635883688926697, "value_dist": 0.45062822103500366, "value_other_env": 0.24112866818904877, "value_corner": 0.7648774981498718, "value_row": 0.43457311391830444, "value_any": 0.24112866818904877, "value_bot": 0.03310069814324379, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02560.png", "entropy": 0.07807233929634094} +{"ts": "2026-01-29T22:16:13.871472Z", "loop": 2570, "env_steps": 1579008000, "exact_value_avg": 0.45272207260131836, "regret_dist": 0.3510552942752838, "regret_other_env": 0.5850866436958313, "regret_corner": 8.248786798503716e-06, "regret_row": 0.3690422475337982, "regret_any": 0.5850866436958313, "regret_bot": 0.7603105902671814, "value_dist": 0.45272207260131836, "value_other_env": 0.24446643888950348, "value_corner": 0.7651054859161377, "value_row": 0.42764678597450256, "value_any": 0.24446643888950348, "value_bot": 0.03637842461466789, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02570.png", "entropy": 0.04397670179605484} +{"ts": "2026-01-29T22:16:25.525963Z", "loop": 2580, "env_steps": 1585152000, "exact_value_avg": 0.45174843072891235, "regret_dist": 0.3520289957523346, "regret_other_env": 0.5867088437080383, "regret_corner": 9.151796803053003e-06, "regret_row": 0.3785002827644348, "regret_any": 0.5867088437080383, "regret_bot": 0.7589138746261597, "value_dist": 0.45174843072891235, "value_other_env": 0.24284431338310242, "value_corner": 0.7651045918464661, "value_row": 0.41818875074386597, "value_any": 0.24284431338310242, "value_bot": 0.0377751924097538, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02580.png", "entropy": 0.044077008962631226} +{"ts": "2026-01-29T22:16:37.192981Z", "loop": 2590, "env_steps": 1591296000, "exact_value_avg": 0.4525715708732605, "regret_dist": 0.3512057960033417, "regret_other_env": 0.5853369235992432, "regret_corner": 9.108583981287666e-06, "regret_row": 0.3700951039791107, "regret_any": 0.5853369235992432, "regret_bot": 0.7598327994346619, "value_dist": 0.4525715708732605, "value_other_env": 0.24421612918376923, "value_corner": 0.7651046514511108, "value_row": 0.42659392952919006, "value_any": 0.24421612918376923, "value_bot": 0.03685625270009041, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02590.png", "entropy": 0.04335649311542511} +{"ts": "2026-01-29T22:16:48.849202Z", "loop": 2600, "env_steps": 1597440000, "exact_value_avg": 0.4527929723262787, "regret_dist": 0.3509843945503235, "regret_other_env": 0.5849669575691223, "regret_corner": 1.0519723218749277e-05, "regret_row": 0.3677239418029785, "regret_any": 0.5849669575691223, "regret_bot": 0.7612842321395874, "value_dist": 0.4527929723262787, "value_other_env": 0.24458616971969604, "value_corner": 0.7651031613349915, "value_row": 0.42896515130996704, "value_any": 0.24458616971969604, "value_bot": 0.035404838621616364, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02600.png", "entropy": 0.047124143689870834} +{"ts": "2026-01-29T22:17:00.517946Z", "loop": 2610, "env_steps": 1603584000, "exact_value_avg": 0.45252692699432373, "regret_dist": 0.35125041007995605, "regret_other_env": 0.5854082107543945, "regret_corner": 1.3703108379559126e-05, "regret_row": 0.36368489265441895, "regret_any": 0.5854082107543945, "regret_bot": 0.7623827457427979, "value_dist": 0.45252692699432373, "value_other_env": 0.24414487183094025, "value_corner": 0.7651000022888184, "value_row": 0.43300411105155945, "value_any": 0.24414487183094025, "value_bot": 0.03430629149079323, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02610.png", "entropy": 0.05580006539821625} +{"ts": "2026-01-29T22:17:12.183565Z", "loop": 2620, "env_steps": 1609728000, "exact_value_avg": 0.45251375436782837, "regret_dist": 0.3512636125087738, "regret_other_env": 0.5854328274726868, "regret_corner": 9.7448628366692e-06, "regret_row": 0.3702313303947449, "regret_any": 0.5854328274726868, "regret_bot": 0.7598623633384705, "value_dist": 0.45251375436782837, "value_other_env": 0.2441202849149704, "value_corner": 0.7651039361953735, "value_row": 0.4264577031135559, "value_any": 0.2441202849149704, "value_bot": 0.036826666444540024, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02620.png", "entropy": 0.041738614439964294} +{"ts": "2026-01-29T22:17:23.834919Z", "loop": 2630, "env_steps": 1615872000, "exact_value_avg": 0.45218056440353394, "regret_dist": 0.35159680247306824, "regret_other_env": 0.5859875679016113, "regret_corner": 1.0641912922437768e-05, "regret_row": 0.3724272549152374, "regret_any": 0.5859875679016113, "regret_bot": 0.759801983833313, "value_dist": 0.45218056440353394, "value_other_env": 0.24356555938720703, "value_corner": 0.7651030421257019, "value_row": 0.42426183819770813, "value_any": 0.24356555938720703, "value_bot": 0.036887042224407196, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02630.png", "entropy": 0.04098522663116455} +{"ts": "2026-01-29T22:17:35.487854Z", "loop": 2640, "env_steps": 1622016000, "exact_value_avg": 0.4520037770271301, "regret_dist": 0.3517736494541168, "regret_other_env": 0.5862833261489868, "regret_corner": 9.085734745895024e-06, "regret_row": 0.3749576210975647, "regret_any": 0.5862833261489868, "regret_bot": 0.7590769529342651, "value_dist": 0.4520037770271301, "value_other_env": 0.24326980113983154, "value_corner": 0.7651047110557556, "value_row": 0.42173147201538086, "value_any": 0.24326980113983154, "value_bot": 0.03761204704642296, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02640.png", "entropy": 0.03992679715156555} +{"ts": "2026-01-29T22:17:47.158010Z", "loop": 2650, "env_steps": 1628160000, "exact_value_avg": 0.45219630002975464, "regret_dist": 0.3515811264514923, "regret_other_env": 0.5859518647193909, "regret_corner": 2.4960439986898564e-05, "regret_row": 0.3684140741825104, "regret_any": 0.5859518647193909, "regret_bot": 0.7623874545097351, "value_dist": 0.45219630002975464, "value_other_env": 0.24360129237174988, "value_corner": 0.7650887966156006, "value_row": 0.4282749891281128, "value_any": 0.24360129237174988, "value_bot": 0.03430165350437164, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02650.png", "entropy": 0.04540986195206642} +{"ts": "2026-01-29T22:17:58.820097Z", "loop": 2660, "env_steps": 1634304000, "exact_value_avg": 0.45272839069366455, "regret_dist": 0.3510489761829376, "regret_other_env": 0.585073709487915, "regret_corner": 1.1818111488537397e-05, "regret_row": 0.3684740662574768, "regret_any": 0.585073709487915, "regret_bot": 0.7613660097122192, "value_dist": 0.45272839069366455, "value_other_env": 0.24447940289974213, "value_corner": 0.7651019096374512, "value_row": 0.428214967250824, "value_any": 0.24447940289974213, "value_bot": 0.03532302752137184, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02660.png", "entropy": 0.04125337302684784} +{"ts": "2026-01-29T22:18:10.468082Z", "loop": 2670, "env_steps": 1640448000, "exact_value_avg": 0.4498614966869354, "regret_dist": 0.35391587018966675, "regret_other_env": 0.5898274779319763, "regret_corner": 4.8444671847391874e-05, "regret_row": 0.39620664715766907, "regret_any": 0.5898274779319763, "regret_bot": 0.7585795521736145, "value_dist": 0.4498614966869354, "value_other_env": 0.23972558975219727, "value_corner": 0.7650653123855591, "value_row": 0.4004823863506317, "value_any": 0.23972558975219727, "value_bot": 0.03810945898294449, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02670.png", "entropy": 0.0482606515288353} +{"ts": "2026-01-29T22:18:22.136736Z", "loop": 2680, "env_steps": 1646592000, "exact_value_avg": 0.4510512351989746, "regret_dist": 0.3527261018753052, "regret_other_env": 0.587851881980896, "regret_corner": 3.7369631172623485e-05, "regret_row": 0.3864192068576813, "regret_any": 0.587851881980896, "regret_bot": 0.75864577293396, "value_dist": 0.4510512351989746, "value_other_env": 0.2417011708021164, "value_corner": 0.7650763392448425, "value_row": 0.4102698564529419, "value_any": 0.2417011708021164, "value_bot": 0.03804325684905052, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02680.png", "entropy": 0.04886150360107422} +{"ts": "2026-01-29T22:18:33.799033Z", "loop": 2690, "env_steps": 1652736000, "exact_value_avg": 0.45271170139312744, "regret_dist": 0.35106566548347473, "regret_other_env": 0.5850991606712341, "regret_corner": 1.5405317753902636e-05, "regret_row": 0.37004491686820984, "regret_any": 0.5850991606712341, "regret_bot": 0.7597742676734924, "value_dist": 0.45271170139312744, "value_other_env": 0.24445396661758423, "value_corner": 0.7650983333587646, "value_row": 0.42664414644241333, "value_any": 0.24445396661758423, "value_bot": 0.036914702504873276, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02690.png", "entropy": 0.04606379196047783} +{"ts": "2026-01-29T22:18:45.452200Z", "loop": 2700, "env_steps": 1658880000, "exact_value_avg": 0.4527457356452942, "regret_dist": 0.35103169083595276, "regret_other_env": 0.5850425958633423, "regret_corner": 1.528114080429077e-05, "regret_row": 0.3696320354938507, "regret_any": 0.5850425958633423, "regret_bot": 0.7598634362220764, "value_dist": 0.4527457356452942, "value_other_env": 0.2445104867219925, "value_corner": 0.765098512172699, "value_row": 0.4270569980144501, "value_any": 0.2445104867219925, "value_bot": 0.03682560473680496, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02700.png", "entropy": 0.04623260721564293} +{"ts": "2026-01-29T22:18:57.106622Z", "loop": 2710, "env_steps": 1665024000, "exact_value_avg": 0.45277950167655945, "regret_dist": 0.3509978652000427, "regret_other_env": 0.5849854946136475, "regret_corner": 1.6390284145018086e-05, "regret_row": 0.3692671060562134, "regret_any": 0.5849854946136475, "regret_bot": 0.7599091529846191, "value_dist": 0.45277950167655945, "value_other_env": 0.24456758797168732, "value_corner": 0.7650973200798035, "value_row": 0.4274219870567322, "value_any": 0.24456758797168732, "value_bot": 0.03677985817193985, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02710.png", "entropy": 0.04717598110437393} +{"ts": "2026-01-29T22:19:08.785950Z", "loop": 2720, "env_steps": 1671168000, "exact_value_avg": 0.45307016372680664, "regret_dist": 0.35070717334747314, "regret_other_env": 0.584499180316925, "regret_corner": 1.916537803481333e-05, "regret_row": 0.36323800683021545, "regret_any": 0.584499180316925, "regret_bot": 0.7609670758247375, "value_dist": 0.45307016372680664, "value_other_env": 0.24505388736724854, "value_corner": 0.7650945782661438, "value_row": 0.4334510564804077, "value_any": 0.24505388736724854, "value_bot": 0.035722002387046814, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02720.png", "entropy": 0.05107447877526283} +{"ts": "2026-01-29T22:19:20.452153Z", "loop": 2730, "env_steps": 1677312000, "exact_value_avg": 0.45208364725112915, "regret_dist": 0.351693719625473, "regret_other_env": 0.5861294269561768, "regret_corner": 4.01263459934853e-05, "regret_row": 0.36202606558799744, "regret_any": 0.5861294269561768, "regret_bot": 0.7627741694450378, "value_dist": 0.45208364725112915, "value_other_env": 0.2434236854314804, "value_corner": 0.7650735378265381, "value_row": 0.43466299772262573, "value_any": 0.2434236854314804, "value_bot": 0.033914852887392044, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02730.png", "entropy": 0.0681481659412384} +{"ts": "2026-01-29T22:19:32.110724Z", "loop": 2740, "env_steps": 1683456000, "exact_value_avg": 0.4530234932899475, "regret_dist": 0.35075387358665466, "regret_other_env": 0.5845803022384644, "regret_corner": 1.4207264939614106e-05, "regret_row": 0.3641677796840668, "regret_any": 0.5845803022384644, "regret_bot": 0.7611569762229919, "value_dist": 0.4530234932899475, "value_other_env": 0.244972825050354, "value_corner": 0.7650995254516602, "value_row": 0.4325212836265564, "value_any": 0.244972825050354, "value_bot": 0.03553207963705063, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02740.png", "entropy": 0.04510875418782234} +{"ts": "2026-01-29T22:19:43.777201Z", "loop": 2750, "env_steps": 1689600000, "exact_value_avg": 0.4528956413269043, "regret_dist": 0.3508816957473755, "regret_other_env": 0.58479243516922, "regret_corner": 1.5562773114652373e-05, "regret_row": 0.36705872416496277, "regret_any": 0.58479243516922, "regret_bot": 0.7607040405273438, "value_dist": 0.4528956413269043, "value_other_env": 0.2447606474161148, "value_corner": 0.7650980949401855, "value_row": 0.4296303391456604, "value_any": 0.2447606474161148, "value_bot": 0.035985033959150314, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02750.png", "entropy": 0.04203222319483757} +{"ts": "2026-01-29T22:19:55.442874Z", "loop": 2760, "env_steps": 1695744000, "exact_value_avg": 0.4528372287750244, "regret_dist": 0.35094013810157776, "regret_other_env": 0.5848878026008606, "regret_corner": 1.8610557162901387e-05, "regret_row": 0.36817291378974915, "regret_any": 0.5848878026008606, "regret_bot": 0.7603185176849365, "value_dist": 0.4528372287750244, "value_other_env": 0.24466529488563538, "value_corner": 0.7650951147079468, "value_row": 0.4285161793231964, "value_any": 0.24466529488563538, "value_bot": 0.036370500922203064, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02760.png", "entropy": 0.042455073446035385} +{"ts": "2026-01-29T22:20:07.104398Z", "loop": 2770, "env_steps": 1701888000, "exact_value_avg": 0.4527602195739746, "regret_dist": 0.35101714730262756, "regret_other_env": 0.5850159525871277, "regret_corner": 1.8935899788630195e-05, "regret_row": 0.3692473769187927, "regret_any": 0.5850159525871277, "regret_bot": 0.759934663772583, "value_dist": 0.4527602195739746, "value_other_env": 0.2445371448993683, "value_corner": 0.7650948166847229, "value_row": 0.42744165658950806, "value_any": 0.2445371448993683, "value_bot": 0.03675440698862076, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02770.png", "entropy": 0.04255428537726402} +{"ts": "2026-01-29T22:20:18.760852Z", "loop": 2780, "env_steps": 1708032000, "exact_value_avg": 0.452994704246521, "regret_dist": 0.35078269243240356, "regret_other_env": 0.584625244140625, "regret_corner": 1.882116157503333e-05, "regret_row": 0.36345264315605164, "regret_any": 0.584625244140625, "regret_bot": 0.7615967392921448, "value_dist": 0.452994704246521, "value_other_env": 0.24492783844470978, "value_corner": 0.7650949358940125, "value_row": 0.43323639035224915, "value_any": 0.24492783844470978, "value_bot": 0.03509232774376869, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02780.png", "entropy": 0.046852026134729385} +{"ts": "2026-01-29T22:20:30.418746Z", "loop": 2790, "env_steps": 1714176000, "exact_value_avg": 0.452659010887146, "regret_dist": 0.3511183559894562, "regret_other_env": 0.5851820707321167, "regret_corner": 2.2744636225979775e-05, "regret_row": 0.36243873834609985, "regret_any": 0.5851820707321167, "regret_bot": 0.7625135183334351, "value_dist": 0.452659010887146, "value_other_env": 0.2443709522485733, "value_corner": 0.7650910019874573, "value_row": 0.4342503249645233, "value_any": 0.2443709522485733, "value_bot": 0.03417554870247841, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02790.png", "entropy": 0.054230302572250366} +{"ts": "2026-01-29T22:20:42.077888Z", "loop": 2800, "env_steps": 1720320000, "exact_value_avg": 0.45109689235687256, "regret_dist": 0.3526804745197296, "regret_other_env": 0.5877472162246704, "regret_corner": 8.034756319830194e-05, "regret_row": 0.36199361085891724, "regret_any": 0.5877472162246704, "regret_bot": 0.7633862495422363, "value_dist": 0.45109689235687256, "value_other_env": 0.24180589616298676, "value_corner": 0.7650333642959595, "value_row": 0.43469542264938354, "value_any": 0.24180589616298676, "value_bot": 0.033302780240774155, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02800.png", "entropy": 0.06805220991373062} +{"ts": "2026-01-29T22:20:53.742140Z", "loop": 2810, "env_steps": 1726464000, "exact_value_avg": 0.45293810963630676, "regret_dist": 0.3508392572402954, "regret_other_env": 0.5847187638282776, "regret_corner": 1.9963583326898515e-05, "regret_row": 0.36442482471466064, "regret_any": 0.5847187638282776, "regret_bot": 0.7616426348686218, "value_dist": 0.45293810963630676, "value_other_env": 0.2448343187570572, "value_corner": 0.7650938034057617, "value_row": 0.4322642683982849, "value_any": 0.2448343187570572, "value_bot": 0.03504641354084015, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02810.png", "entropy": 0.04455230385065079} +{"ts": "2026-01-29T22:21:05.395092Z", "loop": 2820, "env_steps": 1732608000, "exact_value_avg": 0.4530305862426758, "regret_dist": 0.350746750831604, "regret_other_env": 0.584567666053772, "regret_corner": 1.537799835205078e-05, "regret_row": 0.36431121826171875, "regret_any": 0.584567666053772, "regret_bot": 0.7609397172927856, "value_dist": 0.4530305862426758, "value_other_env": 0.2449854016304016, "value_corner": 0.7650983333587646, "value_row": 0.4323778450489044, "value_any": 0.2449854016304016, "value_bot": 0.03574938327074051, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02820.png", "entropy": 0.04342574253678322} +{"ts": "2026-01-29T22:21:17.064243Z", "loop": 2830, "env_steps": 1738752000, "exact_value_avg": 0.452985942363739, "regret_dist": 0.35079148411750793, "regret_other_env": 0.5846441984176636, "regret_corner": 1.2374421203276142e-05, "regret_row": 0.3659369945526123, "regret_any": 0.5846441984176636, "regret_bot": 0.7603707313537598, "value_dist": 0.452985942363739, "value_other_env": 0.2449089139699936, "value_corner": 0.765101432800293, "value_row": 0.4307520091533661, "value_any": 0.2449089139699936, "value_bot": 0.03631829842925072, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02830.png", "entropy": 0.04193738102912903} +{"ts": "2026-01-29T22:21:28.730446Z", "loop": 2840, "env_steps": 1744896000, "exact_value_avg": 0.4520055055618286, "regret_dist": 0.35177189111709595, "regret_other_env": 0.5862670540809631, "regret_corner": 2.9119850296410732e-05, "regret_row": 0.3767133057117462, "regret_any": 0.5862670540809631, "regret_bot": 0.7586809992790222, "value_dist": 0.4520055055618286, "value_other_env": 0.24328605830669403, "value_corner": 0.7650846242904663, "value_row": 0.41997572779655457, "value_any": 0.24328605830669403, "value_bot": 0.038008011877536774, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02840.png", "entropy": 0.04507629573345184} +{"ts": "2026-01-29T22:21:40.393225Z", "loop": 2850, "env_steps": 1751040000, "exact_value_avg": 0.4499448239803314, "regret_dist": 0.35383254289627075, "regret_other_env": 0.5885655879974365, "regret_corner": 0.0017329545225948095, "regret_row": 0.39433524012565613, "regret_any": 0.5885655879974365, "regret_bot": 0.7586078643798828, "value_dist": 0.4499448239803314, "value_other_env": 0.24098752439022064, "value_corner": 0.763380765914917, "value_row": 0.40235382318496704, "value_any": 0.24098752439022064, "value_bot": 0.03808118402957916, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02850.png", "entropy": 0.05325399711728096} +{"ts": "2026-01-29T22:21:52.054259Z", "loop": 2860, "env_steps": 1757184000, "exact_value_avg": 0.45291513204574585, "regret_dist": 0.3508622646331787, "regret_other_env": 0.5847563743591309, "regret_corner": 2.106676583935041e-05, "regret_row": 0.3673115372657776, "regret_any": 0.5847563743591309, "regret_bot": 0.7597901225090027, "value_dist": 0.45291513204574585, "value_other_env": 0.2447967827320099, "value_corner": 0.765092670917511, "value_row": 0.42937755584716797, "value_any": 0.2447967827320099, "value_bot": 0.03689894080162048, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02860.png", "entropy": 0.04721421003341675} +{"ts": "2026-01-29T22:22:03.718166Z", "loop": 2870, "env_steps": 1763328000, "exact_value_avg": 0.4530298411846161, "regret_dist": 0.35074758529663086, "regret_other_env": 0.5845583081245422, "regret_corner": 3.141065462841652e-05, "regret_row": 0.3626815676689148, "regret_any": 0.5845583081245422, "regret_bot": 0.7610228061676025, "value_dist": 0.4530298411846161, "value_other_env": 0.24499480426311493, "value_corner": 0.7650823593139648, "value_row": 0.434007465839386, "value_any": 0.24499480426311493, "value_bot": 0.035666223615407944, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02870.png", "entropy": 0.05209038779139519} +{"ts": "2026-01-29T22:22:15.363207Z", "loop": 2880, "env_steps": 1769472000, "exact_value_avg": 0.4530490040779114, "regret_dist": 0.35072842240333557, "regret_other_env": 0.5845290422439575, "regret_corner": 2.7478736228658818e-05, "regret_row": 0.36448490619659424, "regret_any": 0.5845290422439575, "regret_bot": 0.7602571845054626, "value_dist": 0.4530490040779114, "value_other_env": 0.24502414464950562, "value_corner": 0.7650862336158752, "value_row": 0.43220415711402893, "value_any": 0.24502414464950562, "value_bot": 0.03643185645341873, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02880.png", "entropy": 0.047193191945552826} +{"ts": "2026-01-29T22:22:27.018783Z", "loop": 2890, "env_steps": 1775616000, "exact_value_avg": 0.4524204730987549, "regret_dist": 0.3513568937778473, "regret_other_env": 0.5855669379234314, "regret_corner": 4.181414988124743e-05, "regret_row": 0.3749367892742157, "regret_any": 0.5855669379234314, "regret_bot": 0.7592054605484009, "value_dist": 0.4524204730987549, "value_other_env": 0.2439861297607422, "value_corner": 0.7650719285011292, "value_row": 0.42175227403640747, "value_any": 0.2439861297607422, "value_bot": 0.0374835766851902, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02890.png", "entropy": 0.05075516924262047} +{"ts": "2026-01-29T22:22:38.685163Z", "loop": 2900, "env_steps": 1781760000, "exact_value_avg": 0.45271220803260803, "regret_dist": 0.35106518864631653, "regret_other_env": 0.5850934386253357, "regret_corner": 2.2770962459617294e-05, "regret_row": 0.3705562949180603, "regret_any": 0.5850934386253357, "regret_bot": 0.7595219612121582, "value_dist": 0.45271220803260803, "value_other_env": 0.24445970356464386, "value_corner": 0.7650909423828125, "value_row": 0.4261327385902405, "value_any": 0.24445970356464386, "value_bot": 0.03716708719730377, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02900.png", "entropy": 0.04834497347474098} +{"ts": "2026-01-29T22:22:50.351823Z", "loop": 2910, "env_steps": 1787904000, "exact_value_avg": 0.45298945903778076, "regret_dist": 0.3507879376411438, "regret_other_env": 0.5846324563026428, "regret_corner": 2.1149715394130908e-05, "regret_row": 0.36590638756752014, "regret_any": 0.5846324563026428, "regret_bot": 0.7599338889122009, "value_dist": 0.45298945903778076, "value_other_env": 0.24492067098617554, "value_corner": 0.7650925517082214, "value_row": 0.4307827055454254, "value_any": 0.24492067098617554, "value_bot": 0.036755193024873734, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02910.png", "entropy": 0.04627436771988869} +{"ts": "2026-01-29T22:23:02.019975Z", "loop": 2920, "env_steps": 1794048000, "exact_value_avg": 0.45306509733200073, "regret_dist": 0.35071223974227905, "regret_other_env": 0.5845001339912415, "regret_corner": 3.037899841729086e-05, "regret_row": 0.3627711236476898, "regret_any": 0.5845001339912415, "regret_bot": 0.7609003782272339, "value_dist": 0.45306509733200073, "value_other_env": 0.24505293369293213, "value_corner": 0.765083372592926, "value_row": 0.43391796946525574, "value_any": 0.24505293369293213, "value_bot": 0.035788644105196, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02920.png", "entropy": 0.05075736716389656} +{"ts": "2026-01-29T22:23:13.681843Z", "loop": 2930, "env_steps": 1800192000, "exact_value_avg": 0.4515167474746704, "regret_dist": 0.35226067900657654, "regret_other_env": 0.5870541930198669, "regret_corner": 7.037222530925646e-05, "regret_row": 0.36203137040138245, "regret_any": 0.5870541930198669, "regret_bot": 0.7632713317871094, "value_dist": 0.4515167474746704, "value_other_env": 0.24249893426895142, "value_corner": 0.7650433778762817, "value_row": 0.4346576929092407, "value_any": 0.24249893426895142, "value_bot": 0.03341773524880409, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02930.png", "entropy": 0.06738025695085526} +{"ts": "2026-01-29T22:23:25.343752Z", "loop": 2940, "env_steps": 1806336000, "exact_value_avg": 0.4473103880882263, "regret_dist": 0.35646703839302063, "regret_other_env": 0.5940352082252502, "regret_corner": 0.00011473497579572722, "regret_row": 0.3619672656059265, "regret_any": 0.5940352082252502, "regret_bot": 0.7654480934143066, "value_dist": 0.4473103880882263, "value_other_env": 0.2355179637670517, "value_corner": 0.7649990320205688, "value_row": 0.43472176790237427, "value_any": 0.2355179637670517, "value_bot": 0.031240979209542274, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02940.png", "entropy": 0.06814984232187271} +{"ts": "2026-01-29T22:23:37.003294Z", "loop": 2950, "env_steps": 1812480000, "exact_value_avg": 0.45267659425735474, "regret_dist": 0.35110077261924744, "regret_other_env": 0.5851486921310425, "regret_corner": 2.881288673961535e-05, "regret_row": 0.36612990498542786, "regret_any": 0.5851486921310425, "regret_bot": 0.7623013257980347, "value_dist": 0.45267659425735474, "value_other_env": 0.24440445005893707, "value_corner": 0.7650848627090454, "value_row": 0.43055909872055054, "value_any": 0.24440445005893707, "value_bot": 0.034387677907943726, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02950.png", "entropy": 0.03937835991382599} +{"ts": "2026-01-29T22:23:48.661001Z", "loop": 2960, "env_steps": 1818624000, "exact_value_avg": 0.45238763093948364, "regret_dist": 0.3513897955417633, "regret_other_env": 0.5856404304504395, "regret_corner": 1.3770660189038608e-05, "regret_row": 0.3666543960571289, "regret_any": 0.5856404304504395, "regret_bot": 0.7624101042747498, "value_dist": 0.45238763093948364, "value_other_env": 0.24391265213489532, "value_corner": 0.7651000022888184, "value_row": 0.4300346374511719, "value_any": 0.24391265213489532, "value_bot": 0.03427891433238983, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02960.png", "entropy": 0.03972984105348587} +{"ts": "2026-01-29T22:24:00.322440Z", "loop": 2970, "env_steps": 1824768000, "exact_value_avg": 0.45258545875549316, "regret_dist": 0.35119184851646423, "regret_other_env": 0.5853086709976196, "regret_corner": 1.662025897530839e-05, "regret_row": 0.368561327457428, "regret_any": 0.5853086709976196, "regret_bot": 0.7623026967048645, "value_dist": 0.45258545875549316, "value_other_env": 0.24424438178539276, "value_corner": 0.7650970816612244, "value_row": 0.4281277060508728, "value_any": 0.24424438178539276, "value_bot": 0.0343862920999527, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02970.png", "entropy": 0.03604874014854431} +{"ts": "2026-01-29T22:24:11.992165Z", "loop": 2980, "env_steps": 1830912000, "exact_value_avg": 0.4526578187942505, "regret_dist": 0.35111960768699646, "regret_other_env": 0.5851869583129883, "regret_corner": 1.8580258256406523e-05, "regret_row": 0.36869192123413086, "regret_any": 0.5851869583129883, "regret_bot": 0.7620822787284851, "value_dist": 0.4526578187942505, "value_other_env": 0.24436618387699127, "value_corner": 0.7650951743125916, "value_row": 0.4279971718788147, "value_any": 0.24436618387699127, "value_bot": 0.03460678830742836, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02980.png", "entropy": 0.03550572320818901} +{"ts": "2026-01-29T22:24:23.651976Z", "loop": 2990, "env_steps": 1837056000, "exact_value_avg": 0.4526698887348175, "regret_dist": 0.3511074483394623, "regret_other_env": 0.585161030292511, "regret_corner": 2.7044616217608564e-05, "regret_row": 0.369620680809021, "regret_any": 0.585161030292511, "regret_bot": 0.7597159147262573, "value_dist": 0.4526698887348175, "value_other_env": 0.2443920373916626, "value_corner": 0.7650866508483887, "value_row": 0.4270683526992798, "value_any": 0.2443920373916626, "value_bot": 0.036973074078559875, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_02990.png", "entropy": 0.03530290350317955} +{"ts": "2026-01-29T22:24:35.305044Z", "loop": 3000, "env_steps": 1843200000, "exact_value_avg": 0.4507863223552704, "regret_dist": 0.3529910445213318, "regret_other_env": 0.5883103013038635, "regret_corner": 1.2134512871853076e-05, "regret_row": 0.3878929316997528, "regret_any": 0.5883103013038635, "regret_bot": 0.758570671081543, "value_dist": 0.4507863223552704, "value_other_env": 0.24124279618263245, "value_corner": 0.7651016116142273, "value_row": 0.4087960720062256, "value_any": 0.24124279618263245, "value_bot": 0.03811833634972572, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03000.png", "entropy": 0.03925994038581848} +{"ts": "2026-01-29T22:24:46.958369Z", "loop": 3010, "env_steps": 1849344000, "exact_value_avg": 0.4508052468299866, "regret_dist": 0.352972149848938, "regret_other_env": 0.5880104899406433, "regret_corner": 0.00041461389628238976, "regret_row": 0.3883112967014313, "regret_any": 0.5880104899406433, "regret_bot": 0.7586416602134705, "value_dist": 0.4508052468299866, "value_other_env": 0.24154262244701385, "value_corner": 0.7646991014480591, "value_row": 0.4083777666091919, "value_any": 0.24154262244701385, "value_bot": 0.038047343492507935, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03010.png", "entropy": 0.047363460063934326} +{"ts": "2026-01-29T22:24:58.641699Z", "loop": 3020, "env_steps": 1855488000, "exact_value_avg": 0.4517875611782074, "regret_dist": 0.35198983550071716, "regret_other_env": 0.5862575173377991, "regret_corner": 0.0005882879486307502, "regret_row": 0.379425048828125, "regret_any": 0.5862575173377991, "regret_bot": 0.7593971490859985, "value_dist": 0.4517875611782074, "value_other_env": 0.24329562485218048, "value_corner": 0.7645254135131836, "value_row": 0.4172639548778534, "value_any": 0.24329562485218048, "value_bot": 0.03729189932346344, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03020.png", "entropy": 0.05031033232808113} +{"ts": "2026-01-29T22:25:10.302092Z", "loop": 3030, "env_steps": 1861632000, "exact_value_avg": 0.4530588388442993, "regret_dist": 0.35071849822998047, "regret_other_env": 0.5845170617103577, "regret_corner": 2.0653011233662255e-05, "regret_row": 0.3651440441608429, "regret_any": 0.5845170617103577, "regret_bot": 0.7599751353263855, "value_dist": 0.4530588388442993, "value_other_env": 0.2450360208749771, "value_corner": 0.7650930285453796, "value_row": 0.4315449893474579, "value_any": 0.2450360208749771, "value_bot": 0.0367138609290123, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03030.png", "entropy": 0.05021044984459877} +{"ts": "2026-01-29T22:25:21.955171Z", "loop": 3040, "env_steps": 1867776000, "exact_value_avg": 0.45311301946640015, "regret_dist": 0.3506644070148468, "regret_other_env": 0.5844259858131409, "regret_corner": 2.1950902009848505e-05, "regret_row": 0.3625938892364502, "regret_any": 0.5844259858131409, "regret_bot": 0.7607479095458984, "value_dist": 0.45311301946640015, "value_other_env": 0.2451271116733551, "value_corner": 0.7650918364524841, "value_row": 0.43409520387649536, "value_any": 0.2451271116733551, "value_bot": 0.035941172391176224, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03040.png", "entropy": 0.05331304296851158} +{"ts": "2026-01-29T22:25:33.616083Z", "loop": 3050, "env_steps": 1873920000, "exact_value_avg": 0.45311152935028076, "regret_dist": 0.3506658375263214, "regret_other_env": 0.5844258666038513, "regret_corner": 2.5742750949575566e-05, "regret_row": 0.3623528480529785, "regret_any": 0.5844258666038513, "regret_bot": 0.7608615756034851, "value_dist": 0.45311152935028076, "value_other_env": 0.24512717127799988, "value_corner": 0.7650880217552185, "value_row": 0.4343361556529999, "value_any": 0.24512717127799988, "value_bot": 0.03582748398184776, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03050.png", "entropy": 0.052858028560876846} +{"ts": "2026-01-29T22:25:45.271301Z", "loop": 3060, "env_steps": 1880064000, "exact_value_avg": 0.4531601071357727, "regret_dist": 0.3506172001361847, "regret_other_env": 0.5843493342399597, "regret_corner": 1.899401468108408e-05, "regret_row": 0.36299005150794983, "regret_any": 0.5843493342399597, "regret_bot": 0.7603644132614136, "value_dist": 0.4531601071357727, "value_other_env": 0.24520374834537506, "value_corner": 0.7650946974754333, "value_row": 0.43369898200035095, "value_any": 0.24520374834537506, "value_bot": 0.03632460907101631, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03060.png", "entropy": 0.04685327783226967} +{"ts": "2026-01-29T22:25:56.935342Z", "loop": 3070, "env_steps": 1886208000, "exact_value_avg": 0.45316171646118164, "regret_dist": 0.3506157100200653, "regret_other_env": 0.5843479037284851, "regret_corner": 1.7325084627373144e-05, "regret_row": 0.36320117115974426, "regret_any": 0.5843479037284851, "regret_bot": 0.7602695822715759, "value_dist": 0.45316171646118164, "value_other_env": 0.24520517885684967, "value_corner": 0.7650964260101318, "value_row": 0.4334878623485565, "value_any": 0.24520517885684967, "value_bot": 0.03641940653324127, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03070.png", "entropy": 0.044404152780771255} +{"ts": "2026-01-29T22:26:08.593429Z", "loop": 3080, "env_steps": 1892352000, "exact_value_avg": 0.4524843990802765, "regret_dist": 0.3512929379940033, "regret_other_env": 0.5854314565658569, "regret_corner": 8.514325600117445e-05, "regret_row": 0.3741791248321533, "regret_any": 0.5854314565658569, "regret_bot": 0.7594989538192749, "value_dist": 0.4524843990802765, "value_other_env": 0.24412155151367188, "value_corner": 0.7650286555290222, "value_row": 0.4225098788738251, "value_any": 0.24412155151367188, "value_bot": 0.03719014301896095, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03080.png", "entropy": 0.04845563694834709} +{"ts": "2026-01-29T22:26:20.248187Z", "loop": 3090, "env_steps": 1898496000, "exact_value_avg": 0.44897881150245667, "regret_dist": 0.3547985553741455, "regret_other_env": 0.5894281268119812, "regret_corner": 0.0028541909996420145, "regret_row": 0.4086066782474518, "regret_any": 0.5894281268119812, "regret_bot": 0.7588661313056946, "value_dist": 0.44897881150245667, "value_other_env": 0.24012495577335358, "value_corner": 0.7622596025466919, "value_row": 0.3880824148654938, "value_any": 0.24012495577335358, "value_bot": 0.037822917103767395, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03090.png", "entropy": 0.051028475165367126} +{"ts": "2026-01-29T22:26:31.902758Z", "loop": 3100, "env_steps": 1904640000, "exact_value_avg": 0.452046662569046, "regret_dist": 0.35173070430755615, "regret_other_env": 0.5861716866493225, "regret_corner": 6.924172339495271e-05, "regret_row": 0.3819287121295929, "regret_any": 0.5861716866493225, "regret_bot": 0.7593387365341187, "value_dist": 0.452046662569046, "value_other_env": 0.24338141083717346, "value_corner": 0.7650445103645325, "value_row": 0.4147603213787079, "value_any": 0.24338141083717346, "value_bot": 0.0373503603041172, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03100.png", "entropy": 0.04939521476626396} +{"ts": "2026-01-29T22:26:43.567429Z", "loop": 3110, "env_steps": 1910784000, "exact_value_avg": 0.4483625888824463, "regret_dist": 0.3554147779941559, "regret_other_env": 0.5919223427772522, "regret_corner": 0.0006534054991789162, "regret_row": 0.4358091652393341, "regret_any": 0.5919223427772522, "regret_bot": 0.7588290572166443, "value_dist": 0.4483625888824463, "value_other_env": 0.23763078451156616, "value_corner": 0.7644602656364441, "value_row": 0.36087989807128906, "value_any": 0.23763078451156616, "value_bot": 0.03785998001694679, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03110.png", "entropy": 0.05322970449924469} +{"ts": "2026-01-29T22:26:55.233919Z", "loop": 3120, "env_steps": 1916928000, "exact_value_avg": 0.45119547843933105, "regret_dist": 0.3525818884372711, "regret_other_env": 0.5875715613365173, "regret_corner": 9.739349479787052e-05, "regret_row": 0.39645227789878845, "regret_any": 0.5875715613365173, "regret_bot": 0.7592913508415222, "value_dist": 0.45119547843933105, "value_other_env": 0.24198155105113983, "value_corner": 0.7650163173675537, "value_row": 0.4002368152141571, "value_any": 0.24198155105113983, "value_bot": 0.037397678941488266, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03120.png", "entropy": 0.05011444166302681} +{"ts": "2026-01-29T22:27:06.895042Z", "loop": 3130, "env_steps": 1923072000, "exact_value_avg": 0.4529390335083008, "regret_dist": 0.3508383333683014, "regret_other_env": 0.584708034992218, "regret_corner": 3.37253040925134e-05, "regret_row": 0.3671351373195648, "regret_any": 0.584708034992218, "regret_bot": 0.7598963975906372, "value_dist": 0.4529390335083008, "value_other_env": 0.24484506249427795, "value_corner": 0.7650799751281738, "value_row": 0.42955389618873596, "value_any": 0.24484506249427795, "value_bot": 0.03679263964295387, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03130.png", "entropy": 0.0457971915602684} +{"ts": "2026-01-29T22:27:18.558200Z", "loop": 3140, "env_steps": 1929216000, "exact_value_avg": 0.4529868960380554, "regret_dist": 0.35079050064086914, "regret_other_env": 0.5846357345581055, "regret_corner": 2.2674601495964453e-05, "regret_row": 0.3621925711631775, "regret_any": 0.5846357345581055, "regret_bot": 0.761364221572876, "value_dist": 0.4529868960380554, "value_other_env": 0.2449173778295517, "value_corner": 0.7650911211967468, "value_row": 0.4344964921474457, "value_any": 0.2449173778295517, "value_bot": 0.035324882715940475, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03140.png", "entropy": 0.04956941306591034} +{"ts": "2026-01-29T22:27:30.219174Z", "loop": 3150, "env_steps": 1935360000, "exact_value_avg": 0.45300763845443726, "regret_dist": 0.3507697284221649, "regret_other_env": 0.5846035480499268, "regret_corner": 1.8990536773344502e-05, "regret_row": 0.36232876777648926, "regret_any": 0.5846035480499268, "regret_bot": 0.7614937424659729, "value_dist": 0.45300763845443726, "value_other_env": 0.2449495643377304, "value_corner": 0.7650947570800781, "value_row": 0.4343602955341339, "value_any": 0.2449495643377304, "value_bot": 0.03519529104232788, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03150.png", "entropy": 0.04524897783994675} +{"ts": "2026-01-29T22:27:41.883479Z", "loop": 3160, "env_steps": 1941504000, "exact_value_avg": 0.45310255885124207, "regret_dist": 0.3506748080253601, "regret_other_env": 0.5844469666481018, "regret_corner": 1.6530355424038135e-05, "regret_row": 0.36316633224487305, "regret_any": 0.5844469666481018, "regret_bot": 0.7610041499137878, "value_dist": 0.45310255885124207, "value_other_env": 0.24510611593723297, "value_corner": 0.7650972008705139, "value_row": 0.43352270126342773, "value_any": 0.24510611593723297, "value_bot": 0.03568488359451294, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03160.png", "entropy": 0.03850826621055603} +{"ts": "2026-01-29T22:27:53.548076Z", "loop": 3170, "env_steps": 1947648000, "exact_value_avg": 0.45312148332595825, "regret_dist": 0.3506558835506439, "regret_other_env": 0.5844171047210693, "regret_corner": 1.403192709403811e-05, "regret_row": 0.36285117268562317, "regret_any": 0.5844171047210693, "regret_bot": 0.7610583305358887, "value_dist": 0.45312148332595825, "value_other_env": 0.24513596296310425, "value_corner": 0.7650997638702393, "value_row": 0.433837890625, "value_any": 0.24513596296310425, "value_bot": 0.035630691796541214, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03170.png", "entropy": 0.03900793194770813} +{"ts": "2026-01-29T22:28:05.209911Z", "loop": 3180, "env_steps": 1953792000, "exact_value_avg": 0.45303165912628174, "regret_dist": 0.3507457375526428, "regret_other_env": 0.5845640897750854, "regret_corner": 1.8196305973106064e-05, "regret_row": 0.36490073800086975, "regret_any": 0.5845640897750854, "regret_bot": 0.76068115234375, "value_dist": 0.45303165912628174, "value_other_env": 0.24498900771141052, "value_corner": 0.7650955319404602, "value_row": 0.43178829550743103, "value_any": 0.24498900771141052, "value_bot": 0.03600792586803436, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03180.png", "entropy": 0.03714814782142639} +{"ts": "2026-01-29T22:28:16.872729Z", "loop": 3190, "env_steps": 1959936000, "exact_value_avg": 0.45263946056365967, "regret_dist": 0.3511379063129425, "regret_other_env": 0.5852175951004028, "regret_corner": 1.829415668908041e-05, "regret_row": 0.3718414902687073, "regret_any": 0.5852175951004028, "regret_bot": 0.7596362233161926, "value_dist": 0.45263946056365967, "value_other_env": 0.24433547258377075, "value_corner": 0.7650954127311707, "value_row": 0.4248475730419159, "value_any": 0.24433547258377075, "value_bot": 0.037052810192108154, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03190.png", "entropy": 0.039788927882909775} +{"ts": "2026-01-29T22:28:28.539560Z", "loop": 3200, "env_steps": 1966080000, "exact_value_avg": 0.4529556930065155, "regret_dist": 0.35082167387008667, "regret_other_env": 0.5846778154373169, "regret_corner": 3.7399928260128945e-05, "regret_row": 0.3668467402458191, "regret_any": 0.5846778154373169, "regret_bot": 0.7599395513534546, "value_dist": 0.4529556930065155, "value_other_env": 0.2448752373456955, "value_corner": 0.7650763392448425, "value_row": 0.4298422932624817, "value_any": 0.2448752373456955, "value_bot": 0.03674949333071709, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03200.png", "entropy": 0.04364027455449104} +{"ts": "2026-01-29T22:28:40.201419Z", "loop": 3210, "env_steps": 1972224000, "exact_value_avg": 0.4531075656414032, "regret_dist": 0.35066983103752136, "regret_other_env": 0.5844342112541199, "regret_corner": 2.3229918951983564e-05, "regret_row": 0.3623788356781006, "regret_any": 0.5844342112541199, "regret_bot": 0.7610160708427429, "value_dist": 0.4531075656414032, "value_other_env": 0.24511893093585968, "value_corner": 0.7650904655456543, "value_row": 0.4343101978302002, "value_any": 0.24511893093585968, "value_bot": 0.03567298501729965, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03210.png", "entropy": 0.047914423048496246} +{"ts": "2026-01-29T22:28:51.869109Z", "loop": 3220, "env_steps": 1978368000, "exact_value_avg": 0.4531070590019226, "regret_dist": 0.35067033767700195, "regret_other_env": 0.5844367742538452, "regret_corner": 2.0653011233662255e-05, "regret_row": 0.3626500368118286, "regret_any": 0.5844367742538452, "regret_bot": 0.7608436346054077, "value_dist": 0.4531070590019226, "value_other_env": 0.24511632323265076, "value_corner": 0.7650930881500244, "value_row": 0.43403905630111694, "value_any": 0.24511632323265076, "value_bot": 0.035845477133989334, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03220.png", "entropy": 0.04599328711628914} +{"ts": "2026-01-29T22:29:03.528511Z", "loop": 3230, "env_steps": 1984512000, "exact_value_avg": 0.4530583620071411, "regret_dist": 0.35071903467178345, "regret_other_env": 0.5845159888267517, "regret_corner": 2.353241143282503e-05, "regret_row": 0.36235108971595764, "regret_any": 0.5845159888267517, "regret_bot": 0.7610760927200317, "value_dist": 0.4530583620071411, "value_other_env": 0.24503712356090546, "value_corner": 0.7650902271270752, "value_row": 0.4343380033969879, "value_any": 0.24503712356090546, "value_bot": 0.03561299666762352, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03230.png", "entropy": 0.048123035579919815} +{"ts": "2026-01-29T22:29:15.192717Z", "loop": 3240, "env_steps": 1990656000, "exact_value_avg": 0.45309677720069885, "regret_dist": 0.3506805896759033, "regret_other_env": 0.5844582915306091, "regret_corner": 1.3993681022839155e-05, "regret_row": 0.36401447653770447, "regret_any": 0.5844582915306091, "regret_bot": 0.7602627873420715, "value_dist": 0.45309677720069885, "value_other_env": 0.24509477615356445, "value_corner": 0.7650997638702393, "value_row": 0.4326746165752411, "value_any": 0.24509477615356445, "value_bot": 0.03642624244093895, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03240.png", "entropy": 0.04055923968553543} +{"ts": "2026-01-29T22:29:26.857961Z", "loop": 3250, "env_steps": 1996800000, "exact_value_avg": 0.4527699053287506, "regret_dist": 0.3510074317455292, "regret_other_env": 0.584998607635498, "regret_corner": 2.0623705495381728e-05, "regret_row": 0.37001585960388184, "regret_any": 0.584998607635498, "regret_bot": 0.7597167491912842, "value_dist": 0.4527699053287506, "value_other_env": 0.24455443024635315, "value_corner": 0.7650930881500244, "value_row": 0.42667317390441895, "value_any": 0.24455443024635315, "value_bot": 0.03697231411933899, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03250.png", "entropy": 0.04057992994785309} +{"ts": "2026-01-29T22:29:38.520200Z", "loop": 3260, "env_steps": 2002944000, "exact_value_avg": 0.4526711106300354, "regret_dist": 0.35110628604888916, "regret_other_env": 0.5851636528968811, "regret_corner": 2.0168723494862206e-05, "regret_row": 0.37148648500442505, "regret_any": 0.5851636528968811, "regret_bot": 0.7596702575683594, "value_dist": 0.4526711106300354, "value_other_env": 0.24438945949077606, "value_corner": 0.7650935649871826, "value_row": 0.4252026081085205, "value_any": 0.24438945949077606, "value_bot": 0.037018779665231705, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03260.png", "entropy": 0.03995019569993019} +{"ts": "2026-01-29T22:29:50.174948Z", "loop": 3270, "env_steps": 2009088000, "exact_value_avg": 0.45299631357192993, "regret_dist": 0.35078099370002747, "regret_other_env": 0.5846258997917175, "regret_corner": 1.3651450899487827e-05, "regret_row": 0.36601829528808594, "regret_any": 0.5846258997917175, "regret_bot": 0.7599496245384216, "value_dist": 0.45299631357192993, "value_other_env": 0.24492712318897247, "value_corner": 0.7651001214981079, "value_row": 0.43067076802253723, "value_any": 0.24492712318897247, "value_bot": 0.03673938289284706, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03270.png", "entropy": 0.039649415761232376} +{"ts": "2026-01-29T22:30:01.829192Z", "loop": 3280, "env_steps": 2015232000, "exact_value_avg": 0.4530746340751648, "regret_dist": 0.3507027328014374, "regret_other_env": 0.5844953656196594, "regret_corner": 1.3806423339701723e-05, "regret_row": 0.3648546636104584, "regret_any": 0.5844953656196594, "regret_bot": 0.7600609660148621, "value_dist": 0.4530746340751648, "value_other_env": 0.24505779147148132, "value_corner": 0.7650998830795288, "value_row": 0.4318344295024872, "value_any": 0.24505779147148132, "value_bot": 0.03662804141640663, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03280.png", "entropy": 0.0416770800948143} +{"ts": "2026-01-29T22:30:13.491819Z", "loop": 3290, "env_steps": 2021376000, "exact_value_avg": 0.45314258337020874, "regret_dist": 0.35063478350639343, "regret_other_env": 0.5843836069107056, "regret_corner": 1.1528532013471704e-05, "regret_row": 0.36297154426574707, "regret_any": 0.5843836069107056, "regret_bot": 0.7605923414230347, "value_dist": 0.45314258337020874, "value_other_env": 0.24516946077346802, "value_corner": 0.765102207660675, "value_row": 0.4337174594402313, "value_any": 0.24516946077346802, "value_bot": 0.03609670326113701, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03290.png", "entropy": 0.04454267397522926} +{"ts": "2026-01-29T22:30:25.156659Z", "loop": 3300, "env_steps": 2027520000, "exact_value_avg": 0.4530883729457855, "regret_dist": 0.35068899393081665, "regret_other_env": 0.5844719409942627, "regret_corner": 1.4517705494654365e-05, "regret_row": 0.3621751368045807, "regret_any": 0.5844719409942627, "regret_bot": 0.7610732316970825, "value_dist": 0.4530883729457855, "value_other_env": 0.24508118629455566, "value_corner": 0.7650991678237915, "value_row": 0.4345138967037201, "value_any": 0.24508118629455566, "value_bot": 0.03561578318476677, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03300.png", "entropy": 0.049361806362867355} +{"ts": "2026-01-29T22:30:36.817494Z", "loop": 3310, "env_steps": 2033664000, "exact_value_avg": 0.44210219383239746, "regret_dist": 0.3616752028465271, "regret_other_env": 0.5997175574302673, "regret_corner": 0.004611646290868521, "regret_row": 0.3678213655948639, "regret_any": 0.5997175574302673, "regret_bot": 0.7676499485969543, "value_dist": 0.44210219383239746, "value_other_env": 0.22983556985855103, "value_corner": 0.7605020403862, "value_row": 0.4288676679134369, "value_any": 0.22983556985855103, "value_bot": 0.029039081186056137, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03310.png", "entropy": 0.08902992308139801} +{"ts": "2026-01-29T22:30:48.485063Z", "loop": 3320, "env_steps": 2039808000, "exact_value_avg": 0.45308077335357666, "regret_dist": 0.3506966531276703, "regret_other_env": 0.5844851732254028, "regret_corner": 1.3862054402125068e-05, "regret_row": 0.363362193107605, "regret_any": 0.5844851732254028, "regret_bot": 0.7608699798583984, "value_dist": 0.45308077335357666, "value_other_env": 0.2450679987668991, "value_corner": 0.7650998830795288, "value_row": 0.4333268404006958, "value_any": 0.2450679987668991, "value_bot": 0.03581906855106354, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03320.png", "entropy": 0.03470638021826744} +{"ts": "2026-01-29T22:31:00.157505Z", "loop": 3330, "env_steps": 2045952000, "exact_value_avg": 0.4526997208595276, "regret_dist": 0.3510775864124298, "regret_other_env": 0.5851206183433533, "regret_corner": 1.305838486587163e-05, "regret_row": 0.36975619196891785, "regret_any": 0.5851206183433533, "regret_bot": 0.7598271369934082, "value_dist": 0.4526997208595276, "value_other_env": 0.24443241953849792, "value_corner": 0.7651006579399109, "value_row": 0.4269328713417053, "value_any": 0.24443241953849792, "value_bot": 0.03686192259192467, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03330.png", "entropy": 0.03235196694731712} +{"ts": "2026-01-29T22:31:11.822697Z", "loop": 3340, "env_steps": 2052096000, "exact_value_avg": 0.45168036222457886, "regret_dist": 0.3520970046520233, "regret_other_env": 0.5868013501167297, "regret_corner": 4.0451686800224707e-05, "regret_row": 0.3674362897872925, "regret_any": 0.5868013501167297, "regret_bot": 0.7629384398460388, "value_dist": 0.45168036222457886, "value_other_env": 0.24275171756744385, "value_corner": 0.765073299407959, "value_row": 0.4292527437210083, "value_any": 0.24275171756744385, "value_bot": 0.033750612288713455, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03340.png", "entropy": 0.03543392941355705} +{"ts": "2026-01-29T22:31:23.480888Z", "loop": 3350, "env_steps": 2058240000, "exact_value_avg": 0.45282506942749023, "regret_dist": 0.35095229744911194, "regret_other_env": 0.5849153995513916, "regret_corner": 7.607539828313747e-06, "regret_row": 0.36860668659210205, "regret_any": 0.5849153995513916, "regret_bot": 0.7606599926948547, "value_dist": 0.45282506942749023, "value_other_env": 0.24463769793510437, "value_corner": 0.7651061415672302, "value_row": 0.42808234691619873, "value_any": 0.24463769793510437, "value_bot": 0.03602904453873634, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03350.png", "entropy": 0.030367203056812286} +{"ts": "2026-01-29T22:31:35.149139Z", "loop": 3360, "env_steps": 2064384000, "exact_value_avg": 0.4519461989402771, "regret_dist": 0.3518311679363251, "regret_other_env": 0.5863820910453796, "regret_corner": 4.7892335715005174e-06, "regret_row": 0.37963640689849854, "regret_any": 0.5863820910453796, "regret_bot": 0.7587411999702454, "value_dist": 0.4519461989402771, "value_other_env": 0.24317105114459991, "value_corner": 0.7651088833808899, "value_row": 0.41705265641212463, "value_any": 0.24317105114459991, "value_bot": 0.03794782608747482, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03360.png", "entropy": 0.03368876874446869} +{"ts": "2026-01-29T22:31:46.826165Z", "loop": 3370, "env_steps": 2070528000, "exact_value_avg": 0.4515570104122162, "regret_dist": 0.352220356464386, "regret_other_env": 0.5870253443717957, "regret_corner": 1.2835860616178252e-05, "regret_row": 0.3860578238964081, "regret_any": 0.5870253443717957, "regret_bot": 0.7586733102798462, "value_dist": 0.4515570104122162, "value_other_env": 0.24252772331237793, "value_corner": 0.76510089635849, "value_row": 0.4106312096118927, "value_any": 0.24252772331237793, "value_bot": 0.03801579028367996, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03370.png", "entropy": 0.03805983439087868} +{"ts": "2026-01-29T22:31:58.502529Z", "loop": 3380, "env_steps": 2076672000, "exact_value_avg": 0.4528093934059143, "regret_dist": 0.35096800327301025, "regret_other_env": 0.5849435925483704, "regret_corner": 4.637241545424331e-06, "regret_row": 0.36990857124328613, "regret_any": 0.5849435925483704, "regret_bot": 0.7596558928489685, "value_dist": 0.4528093934059143, "value_other_env": 0.2446095496416092, "value_corner": 0.765109121799469, "value_row": 0.42678046226501465, "value_any": 0.2446095496416092, "value_bot": 0.037033166736364365, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03380.png", "entropy": 0.03446441888809204} +{"ts": "2026-01-29T22:32:10.159734Z", "loop": 3390, "env_steps": 2082816000, "exact_value_avg": 0.45312976837158203, "regret_dist": 0.35064759850502014, "regret_other_env": 0.5844081044197083, "regret_corner": 6.75270985084353e-06, "regret_row": 0.3643701672554016, "regret_any": 0.5844081044197083, "regret_bot": 0.760089635848999, "value_dist": 0.45312976837158203, "value_other_env": 0.24514497816562653, "value_corner": 0.7651069760322571, "value_row": 0.43231892585754395, "value_any": 0.24514497816562653, "value_bot": 0.03659942001104355, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03390.png", "entropy": 0.03385448828339577} +{"ts": "2026-01-29T22:32:21.829471Z", "loop": 3400, "env_steps": 2088960000, "exact_value_avg": 0.4530984163284302, "regret_dist": 0.350678950548172, "regret_other_env": 0.5844616293907166, "regret_corner": 4.887084287474863e-06, "regret_row": 0.3651093542575836, "regret_any": 0.5844616293907166, "regret_bot": 0.7599043846130371, "value_dist": 0.4530984163284302, "value_other_env": 0.24509143829345703, "value_corner": 0.7651088237762451, "value_row": 0.43157970905303955, "value_any": 0.24509143829345703, "value_bot": 0.036784663796424866, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03400.png", "entropy": 0.03477206453680992} +{"ts": "2026-01-29T22:32:33.499908Z", "loop": 3410, "env_steps": 2095104000, "exact_value_avg": 0.4531782865524292, "regret_dist": 0.35059911012649536, "regret_other_env": 0.5843283534049988, "regret_corner": 5.2213672461220995e-06, "regret_row": 0.3634239435195923, "regret_any": 0.5843283534049988, "regret_bot": 0.7601701021194458, "value_dist": 0.4531782865524292, "value_other_env": 0.2452247440814972, "value_corner": 0.7651085257530212, "value_row": 0.4332650601863861, "value_any": 0.2452247440814972, "value_bot": 0.03651892766356468, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03410.png", "entropy": 0.03576593101024628} +{"ts": "2026-01-29T22:32:45.163027Z", "loop": 3420, "env_steps": 2101248000, "exact_value_avg": 0.4528893828392029, "regret_dist": 0.3508880138397217, "regret_other_env": 0.5847997069358826, "regret_corner": 2.0391744328662753e-05, "regret_row": 0.36874204874038696, "regret_any": 0.5847997069358826, "regret_bot": 0.7597565650939941, "value_dist": 0.4528893828392029, "value_other_env": 0.24475343525409698, "value_corner": 0.7650933265686035, "value_row": 0.42794695496559143, "value_any": 0.24475343525409698, "value_bot": 0.03693244233727455, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03420.png", "entropy": 0.03978068009018898} +{"ts": "2026-01-29T22:32:56.828016Z", "loop": 3430, "env_steps": 2107392000, "exact_value_avg": 0.45304715633392334, "regret_dist": 0.3507302403450012, "regret_other_env": 0.5845354795455933, "regret_corner": 2.2352736777975224e-05, "regret_row": 0.36594080924987793, "regret_any": 0.5845354795455933, "regret_bot": 0.7598513960838318, "value_dist": 0.45304715633392334, "value_other_env": 0.2450176328420639, "value_corner": 0.7650913596153259, "value_row": 0.43074825406074524, "value_any": 0.2450176328420639, "value_bot": 0.03683767095208168, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03430.png", "entropy": 0.04105280712246895} +{"ts": "2026-01-29T22:33:08.494379Z", "loop": 3440, "env_steps": 2113536000, "exact_value_avg": 0.453152060508728, "regret_dist": 0.35062533617019653, "regret_other_env": 0.584369957447052, "regret_corner": 8.319815606228076e-06, "regret_row": 0.36400917172431946, "regret_any": 0.584369957447052, "regret_bot": 0.7600249648094177, "value_dist": 0.453152060508728, "value_other_env": 0.24518314003944397, "value_corner": 0.7651054263114929, "value_row": 0.4326798617839813, "value_any": 0.24518314003944397, "value_bot": 0.03666405379772186, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03440.png", "entropy": 0.03911091014742851} +{"ts": "2026-01-29T22:33:20.178160Z", "loop": 3450, "env_steps": 2119680000, "exact_value_avg": 0.45313918590545654, "regret_dist": 0.350638210773468, "regret_other_env": 0.5843912959098816, "regret_corner": 8.538365364074707e-06, "regret_row": 0.36433345079421997, "regret_any": 0.5843912959098816, "regret_bot": 0.759928286075592, "value_dist": 0.45313918590545654, "value_other_env": 0.245161771774292, "value_corner": 0.7651052474975586, "value_row": 0.4323556125164032, "value_any": 0.245161771774292, "value_bot": 0.036760762333869934, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03450.png", "entropy": 0.0389377735555172} +{"ts": "2026-01-29T22:33:31.851336Z", "loop": 3460, "env_steps": 2125824000, "exact_value_avg": 0.4531291127204895, "regret_dist": 0.3506482243537903, "regret_other_env": 0.5844070315361023, "regret_corner": 1.0005633157561533e-05, "regret_row": 0.3645516633987427, "regret_any": 0.5844070315361023, "regret_bot": 0.7598889470100403, "value_dist": 0.4531291127204895, "value_other_env": 0.24514606595039368, "value_corner": 0.7651036977767944, "value_row": 0.4321373999118805, "value_any": 0.24514606595039368, "value_bot": 0.0368000864982605, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03460.png", "entropy": 0.03941868990659714} +{"ts": "2026-01-29T22:33:43.519698Z", "loop": 3470, "env_steps": 2131968000, "exact_value_avg": 0.4530760645866394, "regret_dist": 0.35070133209228516, "regret_other_env": 0.5844908356666565, "regret_corner": 1.70300409081392e-05, "regret_row": 0.3655337393283844, "regret_any": 0.5844908356666565, "regret_bot": 0.7598074674606323, "value_dist": 0.4530760645866394, "value_other_env": 0.24506224691867828, "value_corner": 0.7650967240333557, "value_row": 0.4311552941799164, "value_any": 0.24506224691867828, "value_bot": 0.03688155114650726, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03470.png", "entropy": 0.039993975311517715} +{"ts": "2026-01-29T22:33:55.192534Z", "loop": 3480, "env_steps": 2138112000, "exact_value_avg": 0.45320188999176025, "regret_dist": 0.3505755066871643, "regret_other_env": 0.5842857956886292, "regret_corner": 1.00264951470308e-05, "regret_row": 0.36229127645492554, "regret_any": 0.5842857956886292, "regret_bot": 0.760672390460968, "value_dist": 0.45320188999176025, "value_other_env": 0.2452673465013504, "value_corner": 0.7651036977767944, "value_row": 0.43439778685569763, "value_any": 0.2452673465013504, "value_bot": 0.036016643047332764, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03480.png", "entropy": 0.039005208760499954} +{"ts": "2026-01-29T22:34:06.850746Z", "loop": 3490, "env_steps": 2144256000, "exact_value_avg": 0.4531211853027344, "regret_dist": 0.3506561815738678, "regret_other_env": 0.5844136476516724, "regret_corner": 1.996457649511285e-05, "regret_row": 0.3619576096534729, "regret_any": 0.5844136476516724, "regret_bot": 0.7611085772514343, "value_dist": 0.4531211853027344, "value_other_env": 0.24513942003250122, "value_corner": 0.7650938034057617, "value_row": 0.43473145365715027, "value_any": 0.24513942003250122, "value_bot": 0.03558051213622093, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03490.png", "entropy": 0.04222462698817253} +{"ts": "2026-01-29T22:34:18.506037Z", "loop": 3500, "env_steps": 2150400000, "exact_value_avg": 0.45228123664855957, "regret_dist": 0.3514961302280426, "regret_other_env": 0.5858125686645508, "regret_corner": 2.1474561435752548e-05, "regret_row": 0.3619847893714905, "regret_any": 0.5858125686645508, "regret_bot": 0.7630006670951843, "value_dist": 0.45228123664855957, "value_other_env": 0.2437405288219452, "value_corner": 0.7650922536849976, "value_row": 0.4347042441368103, "value_any": 0.2437405288219452, "value_bot": 0.03368842229247093, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03500.png", "entropy": 0.05454528331756592} +{"ts": "2026-01-29T22:34:30.170113Z", "loop": 3510, "env_steps": 2156544000, "exact_value_avg": 0.4529910981655121, "regret_dist": 0.3507862985134125, "regret_other_env": 0.5846287608146667, "regret_corner": 2.254694845760241e-05, "regret_row": 0.3624403476715088, "regret_any": 0.5846287608146667, "regret_bot": 0.761210024356842, "value_dist": 0.4529910981655121, "value_other_env": 0.24492432177066803, "value_corner": 0.7650912404060364, "value_row": 0.4342486560344696, "value_any": 0.24492432177066803, "value_bot": 0.03547903150320053, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03510.png", "entropy": 0.03632856905460358} +{"ts": "2026-01-29T22:34:41.831143Z", "loop": 3520, "env_steps": 2162688000, "exact_value_avg": 0.45257771015167236, "regret_dist": 0.3511996567249298, "regret_other_env": 0.5853054523468018, "regret_corner": 4.093498137081042e-05, "regret_row": 0.36590906977653503, "regret_any": 0.5853054523468018, "regret_bot": 0.7609736919403076, "value_dist": 0.45257771015167236, "value_other_env": 0.24424761533737183, "value_corner": 0.7650728225708008, "value_row": 0.43077996373176575, "value_any": 0.24424761533737183, "value_bot": 0.035715363919734955, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03520.png", "entropy": 0.03291520103812218} +{"ts": "2026-01-29T22:34:53.500891Z", "loop": 3530, "env_steps": 2168832000, "exact_value_avg": 0.4525153636932373, "regret_dist": 0.35126200318336487, "regret_other_env": 0.5854043364524841, "regret_corner": 4.846950469072908e-05, "regret_row": 0.36454764008522034, "regret_any": 0.5854043364524841, "regret_bot": 0.761939525604248, "value_dist": 0.4525153636932373, "value_other_env": 0.24414870142936707, "value_corner": 0.7650653123855591, "value_row": 0.43214136362075806, "value_any": 0.24414870142936707, "value_bot": 0.034749504178762436, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03530.png", "entropy": 0.032417379319667816} +{"ts": "2026-01-29T22:35:05.171719Z", "loop": 3540, "env_steps": 2174976000, "exact_value_avg": 0.45209288597106934, "regret_dist": 0.35168448090553284, "regret_other_env": 0.586122989654541, "regret_corner": 2.670934009074699e-05, "regret_row": 0.36295148730278015, "regret_any": 0.586122989654541, "regret_bot": 0.7626943588256836, "value_dist": 0.45209288597106934, "value_other_env": 0.24343010783195496, "value_corner": 0.7650870680809021, "value_row": 0.433737576007843, "value_any": 0.24343010783195496, "value_bot": 0.03399473801255226, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03540.png", "entropy": 0.033716458827257156} +{"ts": "2026-01-29T22:35:16.833900Z", "loop": 3550, "env_steps": 2181120000, "exact_value_avg": 0.452984094619751, "regret_dist": 0.3507933020591736, "regret_other_env": 0.5846289992332458, "regret_corner": 3.971159821958281e-05, "regret_row": 0.36481475830078125, "regret_any": 0.5846289992332458, "regret_bot": 0.7613682150840759, "value_dist": 0.452984094619751, "value_other_env": 0.24492409825325012, "value_corner": 0.7650740742683411, "value_row": 0.43187424540519714, "value_any": 0.24492409825325012, "value_bot": 0.03532079979777336, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03550.png", "entropy": 0.030348392203450203} +{"ts": "2026-01-29T22:35:28.495969Z", "loop": 3560, "env_steps": 2187264000, "exact_value_avg": 0.45286622643470764, "regret_dist": 0.35091114044189453, "regret_other_env": 0.5848445296287537, "regret_corner": 1.1024872947018594e-05, "regret_row": 0.3627227246761322, "regret_any": 0.5848445296287537, "regret_bot": 0.7624977231025696, "value_dist": 0.45286622643470764, "value_other_env": 0.24470855295658112, "value_corner": 0.7651026844978333, "value_row": 0.43396633863449097, "value_any": 0.24470855295658112, "value_bot": 0.03419136255979538, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03560.png", "entropy": 0.03282921388745308} +{"ts": "2026-01-29T22:35:40.163227Z", "loop": 3570, "env_steps": 2193408000, "exact_value_avg": 0.4530634880065918, "regret_dist": 0.35071390867233276, "regret_other_env": 0.5845149159431458, "regret_corner": 1.2395779776852578e-05, "regret_row": 0.3627064824104309, "regret_any": 0.5845149159431458, "regret_bot": 0.7619854211807251, "value_dist": 0.4530634880065918, "value_other_env": 0.245038241147995, "value_corner": 0.7651013731956482, "value_row": 0.4339825510978699, "value_any": 0.245038241147995, "value_bot": 0.03470364585518837, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03570.png", "entropy": 0.032279565930366516} +{"ts": "2026-01-29T22:35:51.824720Z", "loop": 3580, "env_steps": 2199552000, "exact_value_avg": 0.45311686396598816, "regret_dist": 0.350660502910614, "regret_other_env": 0.5844258069992065, "regret_corner": 1.2518466064648237e-05, "regret_row": 0.36286869645118713, "regret_any": 0.5844258069992065, "regret_bot": 0.7614656090736389, "value_dist": 0.45311686396598816, "value_other_env": 0.24512726068496704, "value_corner": 0.7651011943817139, "value_row": 0.4338203966617584, "value_any": 0.24512726068496704, "value_bot": 0.035223450511693954, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03580.png", "entropy": 0.031266212463378906} +{"ts": "2026-01-29T22:36:03.485117Z", "loop": 3590, "env_steps": 2205696000, "exact_value_avg": 0.453071653842926, "regret_dist": 0.35070574283599854, "regret_other_env": 0.5845033526420593, "regret_corner": 9.29832549445564e-06, "regret_row": 0.36239808797836304, "regret_any": 0.5845033526420593, "regret_bot": 0.7622126340866089, "value_dist": 0.453071653842926, "value_other_env": 0.24504970014095306, "value_corner": 0.7651044726371765, "value_row": 0.43429097533226013, "value_any": 0.24504970014095306, "value_bot": 0.03447645902633667, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03590.png", "entropy": 0.03385419398546219} +{"ts": "2026-01-29T22:36:15.139895Z", "loop": 3600, "env_steps": 2211840000, "exact_value_avg": 0.45314693450927734, "regret_dist": 0.3506304919719696, "regret_other_env": 0.5843715071678162, "regret_corner": 1.89577549463138e-05, "regret_row": 0.36238735914230347, "regret_any": 0.5843715071678162, "regret_bot": 0.7614660263061523, "value_dist": 0.45314693450927734, "value_other_env": 0.2451816350221634, "value_corner": 0.7650948166847229, "value_row": 0.4343017041683197, "value_any": 0.2451816350221634, "value_bot": 0.03522302955389023, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03600.png", "entropy": 0.0336582325398922} +{"ts": "2026-01-29T22:36:26.807252Z", "loop": 3610, "env_steps": 2217984000, "exact_value_avg": 0.453097939491272, "regret_dist": 0.3506794273853302, "regret_other_env": 0.5844584107398987, "regret_corner": 1.0960798135783989e-05, "regret_row": 0.36225321888923645, "regret_any": 0.5844584107398987, "regret_bot": 0.7620899081230164, "value_dist": 0.453097939491272, "value_other_env": 0.24509470164775848, "value_corner": 0.765102744102478, "value_row": 0.4344358444213867, "value_any": 0.24509470164775848, "value_bot": 0.03459909185767174, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03610.png", "entropy": 0.03623030334711075} +{"ts": "2026-01-29T22:36:38.486425Z", "loop": 3620, "env_steps": 2224128000, "exact_value_avg": 0.44806361198425293, "regret_dist": 0.35571378469467163, "regret_other_env": 0.5927637815475464, "regret_corner": 0.0001387159136356786, "regret_row": 0.36286982893943787, "regret_any": 0.5927637815475464, "regret_bot": 0.7664835453033447, "value_dist": 0.44806361198425293, "value_other_env": 0.23678933084011078, "value_corner": 0.7649750113487244, "value_row": 0.4338192045688629, "value_any": 0.23678933084011078, "value_bot": 0.030205465853214264, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03620.png", "entropy": 0.05932850390672684} +{"ts": "2026-01-29T22:36:50.147645Z", "loop": 3630, "env_steps": 2230272000, "exact_value_avg": 0.45156747102737427, "regret_dist": 0.3522098660469055, "regret_other_env": 0.5870035290718079, "regret_corner": 1.9343695385032333e-05, "regret_row": 0.36192551255226135, "regret_any": 0.5870035290718079, "regret_bot": 0.7645171880722046, "value_dist": 0.45156747102737427, "value_other_env": 0.24254955351352692, "value_corner": 0.7650943994522095, "value_row": 0.43476352095603943, "value_any": 0.24254955351352692, "value_bot": 0.0321718193590641, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03630.png", "entropy": 0.05092238262295723} +{"ts": "2026-01-29T22:37:01.810077Z", "loop": 3640, "env_steps": 2236416000, "exact_value_avg": 0.4530063569545746, "regret_dist": 0.35077103972435, "regret_other_env": 0.5846118330955505, "regret_corner": 9.845197382674087e-06, "regret_row": 0.36211639642715454, "regret_any": 0.5846118330955505, "regret_bot": 0.7623308897018433, "value_dist": 0.4530063569545746, "value_other_env": 0.24494129419326782, "value_corner": 0.7651038765907288, "value_row": 0.43457266688346863, "value_any": 0.24494129419326782, "value_bot": 0.03435814380645752, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03640.png", "entropy": 0.037530310451984406} +{"ts": "2026-01-29T22:37:13.467923Z", "loop": 3650, "env_steps": 2242560000, "exact_value_avg": 0.45303934812545776, "regret_dist": 0.3507380783557892, "regret_other_env": 0.5845571756362915, "regret_corner": 9.36637388804229e-06, "regret_row": 0.3623943328857422, "regret_any": 0.5845571756362915, "regret_bot": 0.7623284459114075, "value_dist": 0.45303934812545776, "value_other_env": 0.24499593675136566, "value_corner": 0.7651044130325317, "value_row": 0.434294730424881, "value_any": 0.24499593675136566, "value_bot": 0.03436066582798958, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03650.png", "entropy": 0.03340926393866539} +{"ts": "2026-01-29T22:37:25.122900Z", "loop": 3660, "env_steps": 2248704000, "exact_value_avg": 0.4530893564224243, "regret_dist": 0.35068798065185547, "regret_other_env": 0.5844744443893433, "regret_corner": 8.260707545559853e-06, "regret_row": 0.3630417287349701, "regret_any": 0.5844744443893433, "regret_bot": 0.7619753479957581, "value_dist": 0.4530893564224243, "value_other_env": 0.24507862329483032, "value_corner": 0.7651054859161377, "value_row": 0.4336472749710083, "value_any": 0.24507862329483032, "value_bot": 0.03471372649073601, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03660.png", "entropy": 0.030194584280252457} +{"ts": "2026-01-29T22:37:36.777726Z", "loop": 3670, "env_steps": 2254848000, "exact_value_avg": 0.45213282108306885, "regret_dist": 0.3516445755958557, "regret_other_env": 0.5860653519630432, "regret_corner": 1.3379256415646523e-05, "regret_row": 0.3619287610054016, "regret_any": 0.5860653519630432, "regret_bot": 0.7634795904159546, "value_dist": 0.45213282108306885, "value_other_env": 0.24348776042461395, "value_corner": 0.7651003003120422, "value_row": 0.43476033210754395, "value_any": 0.24348776042461395, "value_bot": 0.033209480345249176, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03670.png", "entropy": 0.041852712631225586} +{"ts": "2026-01-29T22:37:48.432826Z", "loop": 3680, "env_steps": 2260992000, "exact_value_avg": 0.4527227580547333, "regret_dist": 0.3510545790195465, "regret_other_env": 0.5850830674171448, "regret_corner": 1.1843443644465879e-05, "regret_row": 0.3628140389919281, "regret_any": 0.5850830674171448, "regret_bot": 0.7626730799674988, "value_dist": 0.4527227580547333, "value_other_env": 0.24446998536586761, "value_corner": 0.7651019096374512, "value_row": 0.4338749945163727, "value_any": 0.24446998536586761, "value_bot": 0.03401593491435051, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03680.png", "entropy": 0.032333094626665115} +{"ts": "2026-01-29T22:38:00.089391Z", "loop": 3690, "env_steps": 2267136000, "exact_value_avg": 0.45035791397094727, "regret_dist": 0.3534194529056549, "regret_other_env": 0.5890259742736816, "regret_corner": 9.630124623072334e-06, "regret_row": 0.3619628846645355, "regret_any": 0.5890259742736816, "regret_bot": 0.7644086480140686, "value_dist": 0.45035791397094727, "value_other_env": 0.24052704870700836, "value_corner": 0.7651041150093079, "value_row": 0.43472617864608765, "value_any": 0.24052704870700836, "value_bot": 0.032280486077070236, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03690.png", "entropy": 0.040345415472984314} +{"ts": "2026-01-29T22:38:11.752506Z", "loop": 3700, "env_steps": 2273280000, "exact_value_avg": 0.44815802574157715, "regret_dist": 0.355619341135025, "regret_other_env": 0.5926712155342102, "regret_corner": 4.15032118326053e-05, "regret_row": 0.361918568611145, "regret_any": 0.5926712155342102, "regret_bot": 0.7664800882339478, "value_dist": 0.44815802574157715, "value_other_env": 0.23688186705112457, "value_corner": 0.765072226524353, "value_row": 0.43477052450180054, "value_any": 0.23688186705112457, "value_bot": 0.03020891547203064, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03700.png", "entropy": 0.04764719307422638} +{"ts": "2026-01-29T22:38:23.403436Z", "loop": 3710, "env_steps": 2279424000, "exact_value_avg": 0.4526880979537964, "regret_dist": 0.3510892987251282, "regret_other_env": 0.5851437449455261, "regret_corner": 7.581711088278098e-06, "regret_row": 0.36224550008773804, "regret_any": 0.5851437449455261, "regret_bot": 0.7625938653945923, "value_dist": 0.4526880979537964, "value_other_env": 0.24440932273864746, "value_corner": 0.765106201171875, "value_row": 0.43444350361824036, "value_any": 0.24440932273864746, "value_bot": 0.034095220267772675, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03710.png", "entropy": 0.0339704304933548} +{"ts": "2026-01-29T22:38:35.061937Z", "loop": 3720, "env_steps": 2285568000, "exact_value_avg": 0.4528208076953888, "regret_dist": 0.35095658898353577, "regret_other_env": 0.5849239826202393, "regret_corner": 5.421539299277356e-06, "regret_row": 0.36896249651908875, "regret_any": 0.5849239826202393, "regret_bot": 0.7597419023513794, "value_dist": 0.4528208076953888, "value_other_env": 0.2446291148662567, "value_corner": 0.7651082873344421, "value_row": 0.4277265965938568, "value_any": 0.2446291148662567, "value_bot": 0.03694714978337288, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03720.png", "entropy": 0.02740139327943325} +{"ts": "2026-01-29T22:38:46.720570Z", "loop": 3730, "env_steps": 2291712000, "exact_value_avg": 0.4520428776741028, "regret_dist": 0.35173457860946655, "regret_other_env": 0.58621746301651, "regret_corner": 1.0180473509535659e-05, "regret_row": 0.37523409724235535, "regret_any": 0.58621746301651, "regret_bot": 0.7588633894920349, "value_dist": 0.4520428776741028, "value_other_env": 0.24333569407463074, "value_corner": 0.7651035785675049, "value_row": 0.4214549660682678, "value_any": 0.24333569407463074, "value_bot": 0.037825681269168854, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03730.png", "entropy": 0.03261115401983261} +{"ts": "2026-01-29T22:38:58.392892Z", "loop": 3740, "env_steps": 2297856000, "exact_value_avg": 0.4512021243572235, "regret_dist": 0.3525752127170563, "regret_other_env": 0.5868334174156189, "regret_corner": 0.0011878793593496084, "regret_row": 0.37635117769241333, "regret_any": 0.5868334174156189, "regret_bot": 0.7589828968048096, "value_dist": 0.4512021243572235, "value_other_env": 0.2427196353673935, "value_corner": 0.7639258503913879, "value_row": 0.42033788561820984, "value_any": 0.2427196353673935, "value_bot": 0.037706103175878525, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03740.png", "entropy": 0.03731361776590347} +{"ts": "2026-01-29T22:39:10.059180Z", "loop": 3750, "env_steps": 2304000000, "exact_value_avg": 0.45282572507858276, "regret_dist": 0.3509516417980194, "regret_other_env": 0.5849138498306274, "regret_corner": 8.293986866192427e-06, "regret_row": 0.3694840669631958, "regret_any": 0.5849138498306274, "regret_bot": 0.7597165107727051, "value_dist": 0.45282572507858276, "value_other_env": 0.24463920295238495, "value_corner": 0.7651054859161377, "value_row": 0.427204966545105, "value_any": 0.24463920295238495, "value_bot": 0.036972496658563614, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03750.png", "entropy": 0.033381178975105286} +{"ts": "2026-01-29T22:39:21.719105Z", "loop": 3760, "env_steps": 2310144000, "exact_value_avg": 0.45312684774398804, "regret_dist": 0.3506505489349365, "regret_other_env": 0.584408164024353, "regret_corner": 1.405229249940021e-05, "regret_row": 0.3645498752593994, "regret_any": 0.584408164024353, "regret_bot": 0.7598535418510437, "value_dist": 0.45312684774398804, "value_other_env": 0.24514493346214294, "value_corner": 0.7650996446609497, "value_row": 0.43213915824890137, "value_any": 0.24514493346214294, "value_bot": 0.03683554381132126, "action_probs_image_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611/action_probs/img_03760.png", "entropy": 0.032201722264289856} diff --git a/al_0.6_g_0.97_id_11_seed_970611/eval.log b/al_0.6_g_0.97_id_11_seed_970611/eval.log new file mode 100644 index 0000000000000000000000000000000000000000..52283f86b346b36094ff2338504a11952446ef4d --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/eval.log @@ -0,0 +1,852 @@ +[2026-01-29T21:25:57.740706Z] Loop 0: Reg: 0.7080, AltReg: 0.7103, CorReg: 0.7044, TopReg: 0.7088, AllReg: 0.7103, BotRReg: 0.7089, OV: 0.0958, AltV: 0.1193, CorV: 0.0607, TopV: 0.0879, BotRV: 0.0878, AllV: 0.1193 +[2026-01-29T21:25:59.016902Z] Loop 1: Reg: 0.7076, AltReg: 0.7103, CorReg: 0.7036, TopReg: 0.7082, AllReg: 0.7103, BotRReg: 0.7094, OV: 0.0961, AltV: 0.1193, CorV: 0.0615, TopV: 0.0884, BotRV: 0.0873, AllV: 0.1193 +[2026-01-29T21:26:00.230766Z] Loop 2: Reg: 0.7073, AltReg: 0.7103, CorReg: 0.7029, TopReg: 0.7077, AllReg: 0.7103, BotRReg: 0.7099, OV: 0.0965, AltV: 0.1193, CorV: 0.0622, TopV: 0.0890, BotRV: 0.0868, AllV: 0.1193 +[2026-01-29T21:26:01.436844Z] Loop 3: Reg: 0.7070, AltReg: 0.7103, CorReg: 0.7021, TopReg: 0.7072, AllReg: 0.7103, BotRReg: 0.7104, OV: 0.0968, AltV: 0.1193, CorV: 0.0630, TopV: 0.0895, BotRV: 0.0863, AllV: 0.1193 +[2026-01-29T21:26:02.642410Z] Loop 4: Reg: 0.7067, AltReg: 0.7103, CorReg: 0.7014, TopReg: 0.7067, AllReg: 0.7103, BotRReg: 0.7109, OV: 0.0971, AltV: 0.1193, CorV: 0.0637, TopV: 0.0900, BotRV: 0.0858, AllV: 0.1193 +[2026-01-29T21:26:03.846492Z] Loop 5: Reg: 0.7064, AltReg: 0.7103, CorReg: 0.7006, TopReg: 0.7062, AllReg: 0.7103, BotRReg: 0.7114, OV: 0.0974, AltV: 0.1193, CorV: 0.0645, TopV: 0.0905, BotRV: 0.0853, AllV: 0.1193 +[2026-01-29T21:26:05.052930Z] Loop 6: Reg: 0.7061, AltReg: 0.7102, CorReg: 0.6999, TopReg: 0.7057, AllReg: 0.7102, BotRReg: 0.7118, OV: 0.0977, AltV: 0.1193, CorV: 0.0652, TopV: 0.0910, BotRV: 0.0849, AllV: 0.1193 +[2026-01-29T21:26:06.271669Z] Loop 7: Reg: 0.7058, AltReg: 0.7102, CorReg: 0.6992, TopReg: 0.7052, AllReg: 0.7102, BotRReg: 0.7123, OV: 0.0980, AltV: 0.1193, CorV: 0.0659, TopV: 0.0915, BotRV: 0.0844, AllV: 0.1193 +[2026-01-29T21:26:07.484643Z] Loop 8: Reg: 0.7055, AltReg: 0.7102, CorReg: 0.6985, TopReg: 0.7047, AllReg: 0.7102, BotRReg: 0.7127, OV: 0.0982, AltV: 0.1193, CorV: 0.0666, TopV: 0.0920, BotRV: 0.0840, AllV: 0.1193 +[2026-01-29T21:26:08.691765Z] Loop 9: Reg: 0.7052, AltReg: 0.7102, CorReg: 0.6977, TopReg: 0.7042, AllReg: 0.7102, BotRReg: 0.7132, OV: 0.0985, AltV: 0.1193, CorV: 0.0674, TopV: 0.0925, BotRV: 0.0835, AllV: 0.1193 +[2026-01-29T21:26:09.896591Z] Loop 10: Reg: 0.7049, AltReg: 0.7102, CorReg: 0.6970, TopReg: 0.7037, AllReg: 0.7102, BotRReg: 0.7136, OV: 0.0988, AltV: 0.1193, CorV: 0.0681, TopV: 0.0929, BotRV: 0.0831, AllV: 0.1193 +[2026-01-29T21:26:11.099014Z] Loop 11: Reg: 0.7046, AltReg: 0.7102, CorReg: 0.6962, TopReg: 0.7032, AllReg: 0.7102, BotRReg: 0.7141, OV: 0.0992, AltV: 0.1193, CorV: 0.0689, TopV: 0.0934, BotRV: 0.0826, AllV: 0.1193 +[2026-01-29T21:26:12.303683Z] Loop 12: Reg: 0.7043, AltReg: 0.7102, CorReg: 0.6954, TopReg: 0.7027, AllReg: 0.7102, BotRReg: 0.7146, OV: 0.0995, AltV: 0.1193, CorV: 0.0697, TopV: 0.0940, BotRV: 0.0821, AllV: 0.1193 +[2026-01-29T21:26:13.514111Z] Loop 13: Reg: 0.7040, AltReg: 0.7103, CorReg: 0.6945, TopReg: 0.7022, AllReg: 0.7103, BotRReg: 0.7151, OV: 0.0998, AltV: 0.1193, CorV: 0.0706, TopV: 0.0945, BotRV: 0.0816, AllV: 0.1193 +[2026-01-29T21:26:14.724583Z] Loop 14: Reg: 0.7036, AltReg: 0.7103, CorReg: 0.6936, TopReg: 0.7017, AllReg: 0.7103, BotRReg: 0.7156, OV: 0.1002, AltV: 0.1193, CorV: 0.0715, TopV: 0.0950, BotRV: 0.0811, AllV: 0.1193 +[2026-01-29T21:26:15.929380Z] Loop 15: Reg: 0.7032, AltReg: 0.7103, CorReg: 0.6927, TopReg: 0.7011, AllReg: 0.7103, BotRReg: 0.7161, OV: 0.1005, AltV: 0.1193, CorV: 0.0724, TopV: 0.0956, BotRV: 0.0806, AllV: 0.1193 +[2026-01-29T21:26:17.131668Z] Loop 16: Reg: 0.7029, AltReg: 0.7103, CorReg: 0.6917, TopReg: 0.7005, AllReg: 0.7103, BotRReg: 0.7166, OV: 0.1009, AltV: 0.1193, CorV: 0.0734, TopV: 0.0962, BotRV: 0.0801, AllV: 0.1193 +[2026-01-29T21:26:18.336201Z] Loop 17: Reg: 0.7025, AltReg: 0.7103, CorReg: 0.6907, TopReg: 0.6999, AllReg: 0.7103, BotRReg: 0.7171, OV: 0.1013, AltV: 0.1193, CorV: 0.0744, TopV: 0.0968, BotRV: 0.0796, AllV: 0.1193 +[2026-01-29T21:26:19.544394Z] Loop 18: Reg: 0.7021, AltReg: 0.7103, CorReg: 0.6897, TopReg: 0.6993, AllReg: 0.7103, BotRReg: 0.7177, OV: 0.1017, AltV: 0.1193, CorV: 0.0754, TopV: 0.0974, BotRV: 0.0790, AllV: 0.1193 +[2026-01-29T21:26:20.750471Z] Loop 19: Reg: 0.7016, AltReg: 0.7103, CorReg: 0.6886, TopReg: 0.6987, AllReg: 0.7103, BotRReg: 0.7182, OV: 0.1022, AltV: 0.1192, CorV: 0.0765, TopV: 0.0980, BotRV: 0.0785, AllV: 0.1192 +[2026-01-29T21:26:21.958664Z] Loop 20: Reg: 0.7012, AltReg: 0.7103, CorReg: 0.6874, TopReg: 0.6980, AllReg: 0.7103, BotRReg: 0.7188, OV: 0.1026, AltV: 0.1192, CorV: 0.0777, TopV: 0.0987, BotRV: 0.0779, AllV: 0.1192 +[2026-01-29T21:26:23.164854Z] Loop 21: Reg: 0.7007, AltReg: 0.7103, CorReg: 0.6862, TopReg: 0.6973, AllReg: 0.7103, BotRReg: 0.7194, OV: 0.1031, AltV: 0.1192, CorV: 0.0789, TopV: 0.0994, BotRV: 0.0773, AllV: 0.1192 +[2026-01-29T21:26:24.376835Z] Loop 22: Reg: 0.7002, AltReg: 0.7104, CorReg: 0.6850, TopReg: 0.6966, AllReg: 0.7104, BotRReg: 0.7200, OV: 0.1036, AltV: 0.1192, CorV: 0.0801, TopV: 0.1001, BotRV: 0.0767, AllV: 0.1192 +[2026-01-29T21:26:25.579391Z] Loop 23: Reg: 0.6997, AltReg: 0.7104, CorReg: 0.6837, TopReg: 0.6959, AllReg: 0.7104, BotRReg: 0.7206, OV: 0.1041, AltV: 0.1192, CorV: 0.0815, TopV: 0.1008, BotRV: 0.0761, AllV: 0.1192 +[2026-01-29T21:26:26.782397Z] Loop 24: Reg: 0.6992, AltReg: 0.7104, CorReg: 0.6823, TopReg: 0.6951, AllReg: 0.7104, BotRReg: 0.7212, OV: 0.1046, AltV: 0.1191, CorV: 0.0828, TopV: 0.1016, BotRV: 0.0754, AllV: 0.1191 +[2026-01-29T21:26:27.985042Z] Loop 25: Reg: 0.6986, AltReg: 0.7104, CorReg: 0.6808, TopReg: 0.6943, AllReg: 0.7104, BotRReg: 0.7219, OV: 0.1052, AltV: 0.1191, CorV: 0.0843, TopV: 0.1024, BotRV: 0.0748, AllV: 0.1191 +[2026-01-29T21:26:29.186680Z] Loop 26: Reg: 0.6980, AltReg: 0.7105, CorReg: 0.6792, TopReg: 0.6934, AllReg: 0.7105, BotRReg: 0.7226, OV: 0.1058, AltV: 0.1191, CorV: 0.0859, TopV: 0.1032, BotRV: 0.0741, AllV: 0.1191 +[2026-01-29T21:26:30.391508Z] Loop 27: Reg: 0.6973, AltReg: 0.7105, CorReg: 0.6775, TopReg: 0.6925, AllReg: 0.7105, BotRReg: 0.7233, OV: 0.1065, AltV: 0.1191, CorV: 0.0876, TopV: 0.1041, BotRV: 0.0733, AllV: 0.1191 +[2026-01-29T21:26:31.597513Z] Loop 28: Reg: 0.6966, AltReg: 0.7105, CorReg: 0.6757, TopReg: 0.6916, AllReg: 0.7105, BotRReg: 0.7241, OV: 0.1072, AltV: 0.1190, CorV: 0.0894, TopV: 0.1051, BotRV: 0.0726, AllV: 0.1190 +[2026-01-29T21:26:32.799287Z] Loop 29: Reg: 0.6959, AltReg: 0.7106, CorReg: 0.6738, TopReg: 0.6906, AllReg: 0.7106, BotRReg: 0.7249, OV: 0.1079, AltV: 0.1190, CorV: 0.0914, TopV: 0.1061, BotRV: 0.0718, AllV: 0.1190 +[2026-01-29T21:26:34.003398Z] Loop 30: Reg: 0.6951, AltReg: 0.7106, CorReg: 0.6717, TopReg: 0.6895, AllReg: 0.7106, BotRReg: 0.7258, OV: 0.1087, AltV: 0.1189, CorV: 0.0934, TopV: 0.1072, BotRV: 0.0709, AllV: 0.1189 +[2026-01-29T21:26:35.208169Z] Loop 31: Reg: 0.6942, AltReg: 0.7107, CorReg: 0.6694, TopReg: 0.6884, AllReg: 0.7107, BotRReg: 0.7267, OV: 0.1096, AltV: 0.1188, CorV: 0.0957, TopV: 0.1083, BotRV: 0.0700, AllV: 0.1188 +[2026-01-29T21:26:36.413283Z] Loop 32: Reg: 0.6933, AltReg: 0.7108, CorReg: 0.6670, TopReg: 0.6872, AllReg: 0.7108, BotRReg: 0.7276, OV: 0.1105, AltV: 0.1188, CorV: 0.0981, TopV: 0.1095, BotRV: 0.0691, AllV: 0.1188 +[2026-01-29T21:26:37.617935Z] Loop 33: Reg: 0.6923, AltReg: 0.7109, CorReg: 0.6644, TopReg: 0.6860, AllReg: 0.7109, BotRReg: 0.7286, OV: 0.1115, AltV: 0.1187, CorV: 0.1008, TopV: 0.1107, BotRV: 0.0681, AllV: 0.1187 +[2026-01-29T21:26:38.820086Z] Loop 34: Reg: 0.6912, AltReg: 0.7109, CorReg: 0.6616, TopReg: 0.6847, AllReg: 0.7109, BotRReg: 0.7296, OV: 0.1126, AltV: 0.1186, CorV: 0.1035, TopV: 0.1120, BotRV: 0.0671, AllV: 0.1186 +[2026-01-29T21:26:40.022859Z] Loop 35: Reg: 0.6901, AltReg: 0.7110, CorReg: 0.6587, TopReg: 0.6833, AllReg: 0.7110, BotRReg: 0.7306, OV: 0.1137, AltV: 0.1185, CorV: 0.1064, TopV: 0.1134, BotRV: 0.0661, AllV: 0.1185 +[2026-01-29T21:26:41.227529Z] Loop 36: Reg: 0.6889, AltReg: 0.7111, CorReg: 0.6556, TopReg: 0.6819, AllReg: 0.7111, BotRReg: 0.7316, OV: 0.1149, AltV: 0.1184, CorV: 0.1096, TopV: 0.1148, BotRV: 0.0650, AllV: 0.1184 +[2026-01-29T21:26:42.433001Z] Loop 37: Reg: 0.6876, AltReg: 0.7113, CorReg: 0.6522, TopReg: 0.6804, AllReg: 0.7113, BotRReg: 0.7327, OV: 0.1161, AltV: 0.1183, CorV: 0.1129, TopV: 0.1162, BotRV: 0.0640, AllV: 0.1183 +[2026-01-29T21:26:43.636700Z] Loop 38: Reg: 0.6863, AltReg: 0.7114, CorReg: 0.6486, TopReg: 0.6788, AllReg: 0.7114, BotRReg: 0.7339, OV: 0.1175, AltV: 0.1182, CorV: 0.1166, TopV: 0.1179, BotRV: 0.0628, AllV: 0.1182 +[2026-01-29T21:26:44.838040Z] Loop 39: Reg: 0.6848, AltReg: 0.7115, CorReg: 0.6446, TopReg: 0.6771, AllReg: 0.7115, BotRReg: 0.7351, OV: 0.1190, AltV: 0.1180, CorV: 0.1205, TopV: 0.1196, BotRV: 0.0616, AllV: 0.1180 +[2026-01-29T21:26:46.040976Z] Loop 40: Reg: 0.6831, AltReg: 0.7117, CorReg: 0.6403, TopReg: 0.6753, AllReg: 0.7117, BotRReg: 0.7364, OV: 0.1206, AltV: 0.1178, CorV: 0.1248, TopV: 0.1214, BotRV: 0.0603, AllV: 0.1178 +[2026-01-29T21:26:47.243824Z] Loop 41: Reg: 0.6814, AltReg: 0.7119, CorReg: 0.6356, TopReg: 0.6733, AllReg: 0.7119, BotRReg: 0.7378, OV: 0.1224, AltV: 0.1176, CorV: 0.1295, TopV: 0.1234, BotRV: 0.0589, AllV: 0.1176 +[2026-01-29T21:26:48.445155Z] Loop 42: Reg: 0.6795, AltReg: 0.7121, CorReg: 0.6305, TopReg: 0.6712, AllReg: 0.7121, BotRReg: 0.7392, OV: 0.1243, AltV: 0.1174, CorV: 0.1347, TopV: 0.1255, BotRV: 0.0575, AllV: 0.1174 +[2026-01-29T21:26:49.648640Z] Loop 43: Reg: 0.6773, AltReg: 0.7124, CorReg: 0.6248, TopReg: 0.6689, AllReg: 0.7124, BotRReg: 0.7407, OV: 0.1264, AltV: 0.1172, CorV: 0.1403, TopV: 0.1278, BotRV: 0.0560, AllV: 0.1172 +[2026-01-29T21:26:50.850577Z] Loop 44: Reg: 0.6750, AltReg: 0.7127, CorReg: 0.6186, TopReg: 0.6665, AllReg: 0.7127, BotRReg: 0.7422, OV: 0.1288, AltV: 0.1169, CorV: 0.1466, TopV: 0.1302, BotRV: 0.0544, AllV: 0.1169 +[2026-01-29T21:26:52.051244Z] Loop 45: Reg: 0.6725, AltReg: 0.7130, CorReg: 0.6118, TopReg: 0.6639, AllReg: 0.7130, BotRReg: 0.7439, OV: 0.1313, AltV: 0.1166, CorV: 0.1534, TopV: 0.1328, BotRV: 0.0528, AllV: 0.1166 +[2026-01-29T21:26:53.254830Z] Loop 46: Reg: 0.6697, AltReg: 0.7133, CorReg: 0.6043, TopReg: 0.6611, AllReg: 0.7133, BotRReg: 0.7456, OV: 0.1341, AltV: 0.1162, CorV: 0.1608, TopV: 0.1356, BotRV: 0.0511, AllV: 0.1162 +[2026-01-29T21:26:54.456976Z] Loop 47: Reg: 0.6667, AltReg: 0.7137, CorReg: 0.5961, TopReg: 0.6581, AllReg: 0.7137, BotRReg: 0.7473, OV: 0.1371, AltV: 0.1158, CorV: 0.1690, TopV: 0.1386, BotRV: 0.0493, AllV: 0.1158 +[2026-01-29T21:26:55.660189Z] Loop 48: Reg: 0.6634, AltReg: 0.7142, CorReg: 0.5872, TopReg: 0.6549, AllReg: 0.7142, BotRReg: 0.7492, OV: 0.1404, AltV: 0.1154, CorV: 0.1779, TopV: 0.1417, BotRV: 0.0475, AllV: 0.1154 +[2026-01-29T21:26:56.864342Z] Loop 49: Reg: 0.6598, AltReg: 0.7147, CorReg: 0.5775, TopReg: 0.6515, AllReg: 0.7147, BotRReg: 0.7511, OV: 0.1440, AltV: 0.1149, CorV: 0.1876, TopV: 0.1452, BotRV: 0.0456, AllV: 0.1149 +[2026-01-29T21:26:58.066572Z] Loop 50: Reg: 0.6559, AltReg: 0.7153, CorReg: 0.5667, TopReg: 0.6479, AllReg: 0.7153, BotRReg: 0.7531, OV: 0.1479, AltV: 0.1143, CorV: 0.1984, TopV: 0.1488, BotRV: 0.0436, AllV: 0.1143 +[2026-01-29T21:26:59.271708Z] Loop 51: Reg: 0.6516, AltReg: 0.7159, CorReg: 0.5550, TopReg: 0.6440, AllReg: 0.7159, BotRReg: 0.7551, OV: 0.1522, AltV: 0.1136, CorV: 0.2101, TopV: 0.1526, BotRV: 0.0416, AllV: 0.1136 +[2026-01-29T21:27:00.473907Z] Loop 52: Reg: 0.6469, AltReg: 0.7167, CorReg: 0.5422, TopReg: 0.6400, AllReg: 0.7167, BotRReg: 0.7571, OV: 0.1569, AltV: 0.1129, CorV: 0.2229, TopV: 0.1567, BotRV: 0.0396, AllV: 0.1129 +[2026-01-29T21:27:01.675493Z] Loop 53: Reg: 0.6418, AltReg: 0.7175, CorReg: 0.5283, TopReg: 0.6358, AllReg: 0.7175, BotRReg: 0.7592, OV: 0.1620, AltV: 0.1120, CorV: 0.2368, TopV: 0.1609, BotRV: 0.0375, AllV: 0.1120 +[2026-01-29T21:27:02.877973Z] Loop 54: Reg: 0.6363, AltReg: 0.7185, CorReg: 0.5131, TopReg: 0.6314, AllReg: 0.7185, BotRReg: 0.7613, OV: 0.1674, AltV: 0.1111, CorV: 0.2520, TopV: 0.1653, BotRV: 0.0354, AllV: 0.1111 +[2026-01-29T21:27:04.083290Z] Loop 55: Reg: 0.6305, AltReg: 0.7195, CorReg: 0.4969, TopReg: 0.6269, AllReg: 0.7195, BotRReg: 0.7634, OV: 0.1733, AltV: 0.1101, CorV: 0.2682, TopV: 0.1698, BotRV: 0.0333, AllV: 0.1101 +[2026-01-29T21:27:05.286178Z] Loop 56: Reg: 0.6242, AltReg: 0.7206, CorReg: 0.4796, TopReg: 0.6222, AllReg: 0.7206, BotRReg: 0.7655, OV: 0.1796, AltV: 0.1089, CorV: 0.2855, TopV: 0.1745, BotRV: 0.0312, AllV: 0.1089 +[2026-01-29T21:27:06.488370Z] Loop 57: Reg: 0.6176, AltReg: 0.7219, CorReg: 0.4612, TopReg: 0.6176, AllReg: 0.7219, BotRReg: 0.7675, OV: 0.1861, AltV: 0.1076, CorV: 0.3039, TopV: 0.1791, BotRV: 0.0292, AllV: 0.1076 +[2026-01-29T21:27:07.689996Z] Loop 58: Reg: 0.6107, AltReg: 0.7233, CorReg: 0.4419, TopReg: 0.6128, AllReg: 0.7233, BotRReg: 0.7695, OV: 0.1931, AltV: 0.1063, CorV: 0.3233, TopV: 0.1838, BotRV: 0.0272, AllV: 0.1063 +[2026-01-29T21:27:08.895199Z] Loop 59: Reg: 0.6035, AltReg: 0.7248, CorReg: 0.4216, TopReg: 0.6081, AllReg: 0.7248, BotRReg: 0.7714, OV: 0.2003, AltV: 0.1048, CorV: 0.3435, TopV: 0.1885, BotRV: 0.0253, AllV: 0.1048 +[2026-01-29T21:27:10.099374Z] Loop 60: Reg: 0.5961, AltReg: 0.7264, CorReg: 0.4006, TopReg: 0.6036, AllReg: 0.7264, BotRReg: 0.7733, OV: 0.2077, AltV: 0.1031, CorV: 0.3645, TopV: 0.1931, BotRV: 0.0234, AllV: 0.1031 +[2026-01-29T21:27:11.302073Z] Loop 61: Reg: 0.5886, AltReg: 0.7281, CorReg: 0.3792, TopReg: 0.5991, AllReg: 0.7281, BotRReg: 0.7750, OV: 0.2152, AltV: 0.1014, CorV: 0.3859, TopV: 0.1975, BotRV: 0.0217, AllV: 0.1014 +[2026-01-29T21:27:12.503905Z] Loop 62: Reg: 0.5810, AltReg: 0.7299, CorReg: 0.3576, TopReg: 0.5949, AllReg: 0.7299, BotRReg: 0.7767, OV: 0.2228, AltV: 0.0996, CorV: 0.4076, TopV: 0.2018, BotRV: 0.0200, AllV: 0.0996 +[2026-01-29T21:27:13.708153Z] Loop 63: Reg: 0.5735, AltReg: 0.7318, CorReg: 0.3360, TopReg: 0.5907, AllReg: 0.7318, BotRReg: 0.7783, OV: 0.2303, AltV: 0.0978, CorV: 0.4291, TopV: 0.2060, BotRV: 0.0184, AllV: 0.0978 +[2026-01-29T21:27:14.912291Z] Loop 64: Reg: 0.5661, AltReg: 0.7337, CorReg: 0.3146, TopReg: 0.5869, AllReg: 0.7337, BotRReg: 0.7798, OV: 0.2377, AltV: 0.0958, CorV: 0.4505, TopV: 0.2098, BotRV: 0.0169, AllV: 0.0958 +[2026-01-29T21:27:16.114738Z] Loop 65: Reg: 0.5589, AltReg: 0.7357, CorReg: 0.2938, TopReg: 0.5832, AllReg: 0.7357, BotRReg: 0.7811, OV: 0.2448, AltV: 0.0938, CorV: 0.4714, TopV: 0.2135, BotRV: 0.0155, AllV: 0.0938 +[2026-01-29T21:27:17.318455Z] Loop 66: Reg: 0.5521, AltReg: 0.7377, CorReg: 0.2736, TopReg: 0.5799, AllReg: 0.7377, BotRReg: 0.7824, OV: 0.2517, AltV: 0.0918, CorV: 0.4915, TopV: 0.2168, BotRV: 0.0143, AllV: 0.0918 +[2026-01-29T21:27:18.521941Z] Loop 67: Reg: 0.5456, AltReg: 0.7397, CorReg: 0.2545, TopReg: 0.5770, AllReg: 0.7397, BotRReg: 0.7835, OV: 0.2581, AltV: 0.0899, CorV: 0.5106, TopV: 0.2197, BotRV: 0.0131, AllV: 0.0899 +[2026-01-29T21:27:19.724576Z] Loop 68: Reg: 0.5397, AltReg: 0.7416, CorReg: 0.2368, TopReg: 0.5746, AllReg: 0.7416, BotRReg: 0.7845, OV: 0.2641, AltV: 0.0880, CorV: 0.5283, TopV: 0.2221, BotRV: 0.0122, AllV: 0.0880 +[2026-01-29T21:27:20.929819Z] Loop 69: Reg: 0.5342, AltReg: 0.7434, CorReg: 0.2203, TopReg: 0.5725, AllReg: 0.7434, BotRReg: 0.7854, OV: 0.2696, AltV: 0.0861, CorV: 0.5448, TopV: 0.2242, BotRV: 0.0113, AllV: 0.0861 +[2026-01-29T21:27:22.136806Z] Loop 70: Reg: 0.5292, AltReg: 0.7452, CorReg: 0.2051, TopReg: 0.5708, AllReg: 0.7452, BotRReg: 0.7862, OV: 0.2746, AltV: 0.0844, CorV: 0.5600, TopV: 0.2259, BotRV: 0.0105, AllV: 0.0844 +[2026-01-29T21:27:23.339339Z] Loop 71: Reg: 0.5246, AltReg: 0.7468, CorReg: 0.1914, TopReg: 0.5696, AllReg: 0.7468, BotRReg: 0.7869, OV: 0.2791, AltV: 0.0828, CorV: 0.5737, TopV: 0.2271, BotRV: 0.0098, AllV: 0.0828 +[2026-01-29T21:27:24.543996Z] Loop 72: Reg: 0.5206, AltReg: 0.7483, CorReg: 0.1790, TopReg: 0.5686, AllReg: 0.7483, BotRReg: 0.7874, OV: 0.2832, AltV: 0.0812, CorV: 0.5861, TopV: 0.2281, BotRV: 0.0093, AllV: 0.0812 +[2026-01-29T21:27:25.750089Z] Loop 73: Reg: 0.5170, AltReg: 0.7497, CorReg: 0.1679, TopReg: 0.5680, AllReg: 0.7497, BotRReg: 0.7879, OV: 0.2868, AltV: 0.0798, CorV: 0.5972, TopV: 0.2287, BotRV: 0.0088, AllV: 0.0798 +[2026-01-29T21:27:26.952988Z] Loop 74: Reg: 0.5138, AltReg: 0.7510, CorReg: 0.1580, TopReg: 0.5676, AllReg: 0.7510, BotRReg: 0.7884, OV: 0.2900, AltV: 0.0786, CorV: 0.6071, TopV: 0.2290, BotRV: 0.0083, AllV: 0.0786 +[2026-01-29T21:27:28.158552Z] Loop 75: Reg: 0.5110, AltReg: 0.7521, CorReg: 0.1493, TopReg: 0.5674, AllReg: 0.7521, BotRReg: 0.7887, OV: 0.2928, AltV: 0.0774, CorV: 0.6159, TopV: 0.2293, BotRV: 0.0080, AllV: 0.0774 +[2026-01-29T21:27:29.363624Z] Loop 76: Reg: 0.5085, AltReg: 0.7532, CorReg: 0.1415, TopReg: 0.5676, AllReg: 0.7532, BotRReg: 0.7890, OV: 0.2953, AltV: 0.0764, CorV: 0.6236, TopV: 0.2291, BotRV: 0.0077, AllV: 0.0764 +[2026-01-29T21:27:30.567021Z] Loop 77: Reg: 0.5063, AltReg: 0.7541, CorReg: 0.1346, TopReg: 0.5682, AllReg: 0.7541, BotRReg: 0.7892, OV: 0.2975, AltV: 0.0755, CorV: 0.6305, TopV: 0.2285, BotRV: 0.0074, AllV: 0.0755 +[2026-01-29T21:27:31.771203Z] Loop 78: Reg: 0.5044, AltReg: 0.7549, CorReg: 0.1286, TopReg: 0.5691, AllReg: 0.7549, BotRReg: 0.7894, OV: 0.2994, AltV: 0.0747, CorV: 0.6365, TopV: 0.2275, BotRV: 0.0073, AllV: 0.0747 +[2026-01-29T21:27:32.975244Z] Loop 79: Reg: 0.5027, AltReg: 0.7556, CorReg: 0.1233, TopReg: 0.5704, AllReg: 0.7556, BotRReg: 0.7895, OV: 0.3011, AltV: 0.0740, CorV: 0.6418, TopV: 0.2263, BotRV: 0.0072, AllV: 0.0740 +[2026-01-29T21:27:34.179882Z] Loop 80: Reg: 0.5012, AltReg: 0.7562, CorReg: 0.1187, TopReg: 0.5721, AllReg: 0.7562, BotRReg: 0.7896, OV: 0.3026, AltV: 0.0733, CorV: 0.6464, TopV: 0.2246, BotRV: 0.0071, AllV: 0.0733 +[2026-01-29T21:27:35.418634Z] Loop 81: Reg: 0.4999, AltReg: 0.7568, CorReg: 0.1145, TopReg: 0.5741, AllReg: 0.7568, BotRReg: 0.7896, OV: 0.3039, AltV: 0.0728, CorV: 0.6506, TopV: 0.2226, BotRV: 0.0071, AllV: 0.0728 +[2026-01-29T21:27:36.622422Z] Loop 82: Reg: 0.4987, AltReg: 0.7573, CorReg: 0.1109, TopReg: 0.5763, AllReg: 0.7573, BotRReg: 0.7896, OV: 0.3050, AltV: 0.0723, CorV: 0.6542, TopV: 0.2204, BotRV: 0.0071, AllV: 0.0723 +[2026-01-29T21:27:37.829500Z] Loop 83: Reg: 0.4978, AltReg: 0.7577, CorReg: 0.1079, TopReg: 0.5788, AllReg: 0.7577, BotRReg: 0.7896, OV: 0.3060, AltV: 0.0718, CorV: 0.6573, TopV: 0.2179, BotRV: 0.0071, AllV: 0.0718 +[2026-01-29T21:27:39.032202Z] Loop 84: Reg: 0.4970, AltReg: 0.7581, CorReg: 0.1054, TopReg: 0.5813, AllReg: 0.7581, BotRReg: 0.7895, OV: 0.3068, AltV: 0.0714, CorV: 0.6598, TopV: 0.2154, BotRV: 0.0072, AllV: 0.0714 +[2026-01-29T21:27:40.242964Z] Loop 85: Reg: 0.4964, AltReg: 0.7585, CorReg: 0.1034, TopReg: 0.5839, AllReg: 0.7585, BotRReg: 0.7894, OV: 0.3073, AltV: 0.0711, CorV: 0.6617, TopV: 0.2128, BotRV: 0.0073, AllV: 0.0711 +[2026-01-29T21:27:41.446500Z] Loop 86: Reg: 0.4960, AltReg: 0.7588, CorReg: 0.1018, TopReg: 0.5865, AllReg: 0.7588, BotRReg: 0.7893, OV: 0.3078, AltV: 0.0708, CorV: 0.6633, TopV: 0.2102, BotRV: 0.0074, AllV: 0.0708 +[2026-01-29T21:27:42.649644Z] Loop 87: Reg: 0.4957, AltReg: 0.7590, CorReg: 0.1007, TopReg: 0.5892, AllReg: 0.7590, BotRReg: 0.7892, OV: 0.3081, AltV: 0.0705, CorV: 0.6644, TopV: 0.2075, BotRV: 0.0075, AllV: 0.0705 +[2026-01-29T21:27:43.852254Z] Loop 88: Reg: 0.4955, AltReg: 0.7593, CorReg: 0.0999, TopReg: 0.5922, AllReg: 0.7593, BotRReg: 0.7890, OV: 0.3082, AltV: 0.0703, CorV: 0.6652, TopV: 0.2045, BotRV: 0.0076, AllV: 0.0703 +[2026-01-29T21:27:45.056790Z] Loop 89: Reg: 0.4954, AltReg: 0.7595, CorReg: 0.0993, TopReg: 0.5940, AllReg: 0.7595, BotRReg: 0.7890, OV: 0.3084, AltV: 0.0701, CorV: 0.6658, TopV: 0.2027, BotRV: 0.0077, AllV: 0.0701 +[2026-01-29T21:27:46.263003Z] Loop 90: Reg: 0.4952, AltReg: 0.7597, CorReg: 0.0985, TopReg: 0.5949, AllReg: 0.7597, BotRReg: 0.7890, OV: 0.3086, AltV: 0.0699, CorV: 0.6666, TopV: 0.2018, BotRV: 0.0077, AllV: 0.0699 +[2026-01-29T21:27:47.466115Z] Loop 91: Reg: 0.4950, AltReg: 0.7598, CorReg: 0.0977, TopReg: 0.5950, AllReg: 0.7598, BotRReg: 0.7890, OV: 0.3088, AltV: 0.0697, CorV: 0.6674, TopV: 0.2017, BotRV: 0.0077, AllV: 0.0697 +[2026-01-29T21:27:48.671434Z] Loop 92: Reg: 0.4947, AltReg: 0.7599, CorReg: 0.0968, TopReg: 0.5942, AllReg: 0.7599, BotRReg: 0.7891, OV: 0.3091, AltV: 0.0696, CorV: 0.6683, TopV: 0.2025, BotRV: 0.0076, AllV: 0.0696 +[2026-01-29T21:27:49.884567Z] Loop 93: Reg: 0.4944, AltReg: 0.7600, CorReg: 0.0959, TopReg: 0.5928, AllReg: 0.7600, BotRReg: 0.7893, OV: 0.3094, AltV: 0.0695, CorV: 0.6692, TopV: 0.2039, BotRV: 0.0074, AllV: 0.0695 +[2026-01-29T21:27:51.090562Z] Loop 94: Reg: 0.4941, AltReg: 0.7601, CorReg: 0.0951, TopReg: 0.5907, AllReg: 0.7601, BotRReg: 0.7895, OV: 0.3097, AltV: 0.0694, CorV: 0.6701, TopV: 0.2060, BotRV: 0.0072, AllV: 0.0694 +[2026-01-29T21:27:52.294572Z] Loop 95: Reg: 0.4939, AltReg: 0.7602, CorReg: 0.0944, TopReg: 0.5887, AllReg: 0.7602, BotRReg: 0.7896, OV: 0.3099, AltV: 0.0693, CorV: 0.6707, TopV: 0.2080, BotRV: 0.0071, AllV: 0.0693 +[2026-01-29T21:27:53.500308Z] Loop 96: Reg: 0.4937, AltReg: 0.7603, CorReg: 0.0940, TopReg: 0.5858, AllReg: 0.7603, BotRReg: 0.7899, OV: 0.3100, AltV: 0.0693, CorV: 0.6712, TopV: 0.2109, BotRV: 0.0068, AllV: 0.0693 +[2026-01-29T21:27:54.703286Z] Loop 97: Reg: 0.4937, AltReg: 0.7603, CorReg: 0.0938, TopReg: 0.5823, AllReg: 0.7603, BotRReg: 0.7901, OV: 0.3100, AltV: 0.0692, CorV: 0.6713, TopV: 0.2144, BotRV: 0.0066, AllV: 0.0692 +[2026-01-29T21:27:55.907615Z] Loop 98: Reg: 0.4939, AltReg: 0.7604, CorReg: 0.0941, TopReg: 0.5788, AllReg: 0.7604, BotRReg: 0.7904, OV: 0.3099, AltV: 0.0692, CorV: 0.6711, TopV: 0.2179, BotRV: 0.0063, AllV: 0.0692 +[2026-01-29T21:27:57.112856Z] Loop 99: Reg: 0.4941, AltReg: 0.7605, CorReg: 0.0944, TopReg: 0.5761, AllReg: 0.7605, BotRReg: 0.7906, OV: 0.3097, AltV: 0.0691, CorV: 0.6707, TopV: 0.2206, BotRV: 0.0061, AllV: 0.0691 +[2026-01-29T21:27:58.315872Z] Loop 100: Reg: 0.4943, AltReg: 0.7605, CorReg: 0.0949, TopReg: 0.5739, AllReg: 0.7605, BotRReg: 0.7907, OV: 0.3095, AltV: 0.0690, CorV: 0.6703, TopV: 0.2228, BotRV: 0.0060, AllV: 0.0690 +[2026-01-29T21:27:59.519888Z] Loop 101: Reg: 0.4943, AltReg: 0.7606, CorReg: 0.0949, TopReg: 0.5733, AllReg: 0.7606, BotRReg: 0.7908, OV: 0.3095, AltV: 0.0690, CorV: 0.6702, TopV: 0.2234, BotRV: 0.0059, AllV: 0.0690 +[2026-01-29T21:28:00.725127Z] Loop 102: Reg: 0.4942, AltReg: 0.7606, CorReg: 0.0945, TopReg: 0.5740, AllReg: 0.7606, BotRReg: 0.7907, OV: 0.3096, AltV: 0.0689, CorV: 0.6706, TopV: 0.2227, BotRV: 0.0059, AllV: 0.0689 +[2026-01-29T21:28:01.933131Z] Loop 103: Reg: 0.4940, AltReg: 0.7606, CorReg: 0.0939, TopReg: 0.5755, AllReg: 0.7606, BotRReg: 0.7907, OV: 0.3098, AltV: 0.0689, CorV: 0.6712, TopV: 0.2212, BotRV: 0.0060, AllV: 0.0689 +[2026-01-29T21:28:03.141240Z] Loop 104: Reg: 0.4937, AltReg: 0.7607, CorReg: 0.0933, TopReg: 0.5775, AllReg: 0.7607, BotRReg: 0.7905, OV: 0.3101, AltV: 0.0689, CorV: 0.6718, TopV: 0.2192, BotRV: 0.0062, AllV: 0.0689 +[2026-01-29T21:28:04.344586Z] Loop 105: Reg: 0.4935, AltReg: 0.7607, CorReg: 0.0927, TopReg: 0.5801, AllReg: 0.7607, BotRReg: 0.7904, OV: 0.3103, AltV: 0.0689, CorV: 0.6724, TopV: 0.2166, BotRV: 0.0063, AllV: 0.0689 +[2026-01-29T21:28:05.546890Z] Loop 106: Reg: 0.4933, AltReg: 0.7607, CorReg: 0.0923, TopReg: 0.5837, AllReg: 0.7607, BotRReg: 0.7901, OV: 0.3105, AltV: 0.0689, CorV: 0.6728, TopV: 0.2130, BotRV: 0.0066, AllV: 0.0689 +[2026-01-29T21:28:06.750253Z] Loop 107: Reg: 0.4933, AltReg: 0.7607, CorReg: 0.0921, TopReg: 0.5871, AllReg: 0.7607, BotRReg: 0.7899, OV: 0.3105, AltV: 0.0689, CorV: 0.6730, TopV: 0.2096, BotRV: 0.0068, AllV: 0.0689 +[2026-01-29T21:28:07.955378Z] Loop 108: Reg: 0.4933, AltReg: 0.7607, CorReg: 0.0923, TopReg: 0.5903, AllReg: 0.7607, BotRReg: 0.7897, OV: 0.3104, AltV: 0.0689, CorV: 0.6728, TopV: 0.2064, BotRV: 0.0070, AllV: 0.0689 +[2026-01-29T21:28:09.165266Z] Loop 109: Reg: 0.4934, AltReg: 0.7607, CorReg: 0.0925, TopReg: 0.5925, AllReg: 0.7607, BotRReg: 0.7895, OV: 0.3103, AltV: 0.0688, CorV: 0.6726, TopV: 0.2042, BotRV: 0.0072, AllV: 0.0688 +[2026-01-29T21:28:10.370826Z] Loop 110: Reg: 0.4936, AltReg: 0.7607, CorReg: 0.0928, TopReg: 0.5945, AllReg: 0.7607, BotRReg: 0.7894, OV: 0.3102, AltV: 0.0688, CorV: 0.6723, TopV: 0.2022, BotRV: 0.0073, AllV: 0.0688 +[2026-01-29T21:28:11.572986Z] Loop 111: Reg: 0.4937, AltReg: 0.7608, CorReg: 0.0931, TopReg: 0.5959, AllReg: 0.7608, BotRReg: 0.7893, OV: 0.3101, AltV: 0.0688, CorV: 0.6720, TopV: 0.2008, BotRV: 0.0074, AllV: 0.0688 +[2026-01-29T21:28:12.774338Z] Loop 112: Reg: 0.4938, AltReg: 0.7608, CorReg: 0.0933, TopReg: 0.5969, AllReg: 0.7608, BotRReg: 0.7892, OV: 0.3100, AltV: 0.0688, CorV: 0.6718, TopV: 0.1998, BotRV: 0.0075, AllV: 0.0688 +[2026-01-29T21:28:13.978133Z] Loop 113: Reg: 0.4939, AltReg: 0.7608, CorReg: 0.0937, TopReg: 0.5981, AllReg: 0.7608, BotRReg: 0.7891, OV: 0.3098, AltV: 0.0688, CorV: 0.6715, TopV: 0.1986, BotRV: 0.0076, AllV: 0.0688 +[2026-01-29T21:28:15.179971Z] Loop 114: Reg: 0.4940, AltReg: 0.7608, CorReg: 0.0937, TopReg: 0.5983, AllReg: 0.7608, BotRReg: 0.7891, OV: 0.3098, AltV: 0.0687, CorV: 0.6714, TopV: 0.1984, BotRV: 0.0076, AllV: 0.0687 +[2026-01-29T21:28:16.383586Z] Loop 115: Reg: 0.4939, AltReg: 0.7608, CorReg: 0.0935, TopReg: 0.5979, AllReg: 0.7608, BotRReg: 0.7891, OV: 0.3099, AltV: 0.0687, CorV: 0.6716, TopV: 0.1988, BotRV: 0.0076, AllV: 0.0687 +[2026-01-29T21:28:17.585056Z] Loop 116: Reg: 0.4939, AltReg: 0.7608, CorReg: 0.0935, TopReg: 0.5981, AllReg: 0.7608, BotRReg: 0.7891, OV: 0.3099, AltV: 0.0687, CorV: 0.6716, TopV: 0.1985, BotRV: 0.0076, AllV: 0.0687 +[2026-01-29T21:28:18.787705Z] Loop 117: Reg: 0.4937, AltReg: 0.7608, CorReg: 0.0931, TopReg: 0.5968, AllReg: 0.7608, BotRReg: 0.7892, OV: 0.3101, AltV: 0.0687, CorV: 0.6720, TopV: 0.1999, BotRV: 0.0075, AllV: 0.0687 +[2026-01-29T21:28:19.991657Z] Loop 118: Reg: 0.4936, AltReg: 0.7608, CorReg: 0.0927, TopReg: 0.5955, AllReg: 0.7608, BotRReg: 0.7893, OV: 0.3102, AltV: 0.0687, CorV: 0.6724, TopV: 0.2012, BotRV: 0.0074, AllV: 0.0687 +[2026-01-29T21:28:21.194618Z] Loop 119: Reg: 0.4934, AltReg: 0.7608, CorReg: 0.0922, TopReg: 0.5933, AllReg: 0.7608, BotRReg: 0.7895, OV: 0.3104, AltV: 0.0687, CorV: 0.6729, TopV: 0.2034, BotRV: 0.0072, AllV: 0.0687 +[2026-01-29T21:28:22.397478Z] Loop 120: Reg: 0.4932, AltReg: 0.7608, CorReg: 0.0918, TopReg: 0.5902, AllReg: 0.7608, BotRReg: 0.7897, OV: 0.3106, AltV: 0.0688, CorV: 0.6733, TopV: 0.2064, BotRV: 0.0070, AllV: 0.0688 +[2026-01-29T21:28:23.599736Z] Loop 121: Reg: 0.4931, AltReg: 0.7608, CorReg: 0.0916, TopReg: 0.5866, AllReg: 0.7608, BotRReg: 0.7900, OV: 0.3107, AltV: 0.0688, CorV: 0.6735, TopV: 0.2101, BotRV: 0.0067, AllV: 0.0688 +[2026-01-29T21:28:24.803540Z] Loop 122: Reg: 0.4932, AltReg: 0.7608, CorReg: 0.0917, TopReg: 0.5826, AllReg: 0.7608, BotRReg: 0.7902, OV: 0.3106, AltV: 0.0687, CorV: 0.6734, TopV: 0.2141, BotRV: 0.0065, AllV: 0.0687 +[2026-01-29T21:28:26.004993Z] Loop 123: Reg: 0.4934, AltReg: 0.7608, CorReg: 0.0922, TopReg: 0.5791, AllReg: 0.7608, BotRReg: 0.7905, OV: 0.3104, AltV: 0.0687, CorV: 0.6729, TopV: 0.2176, BotRV: 0.0062, AllV: 0.0687 +[2026-01-29T21:28:27.205986Z] Loop 124: Reg: 0.4937, AltReg: 0.7609, CorReg: 0.0929, TopReg: 0.5761, AllReg: 0.7609, BotRReg: 0.7907, OV: 0.3101, AltV: 0.0687, CorV: 0.6722, TopV: 0.2206, BotRV: 0.0060, AllV: 0.0687 +[2026-01-29T21:28:28.409388Z] Loop 125: Reg: 0.4940, AltReg: 0.7609, CorReg: 0.0937, TopReg: 0.5734, AllReg: 0.7609, BotRReg: 0.7908, OV: 0.3098, AltV: 0.0687, CorV: 0.6714, TopV: 0.2232, BotRV: 0.0059, AllV: 0.0687 +[2026-01-29T21:28:29.613798Z] Loop 126: Reg: 0.4941, AltReg: 0.7609, CorReg: 0.0939, TopReg: 0.5729, AllReg: 0.7609, BotRReg: 0.7909, OV: 0.3097, AltV: 0.0687, CorV: 0.6712, TopV: 0.2238, BotRV: 0.0058, AllV: 0.0687 +[2026-01-29T21:28:30.817957Z] Loop 127: Reg: 0.4941, AltReg: 0.7609, CorReg: 0.0938, TopReg: 0.5730, AllReg: 0.7609, BotRReg: 0.7909, OV: 0.3097, AltV: 0.0687, CorV: 0.6713, TopV: 0.2237, BotRV: 0.0058, AllV: 0.0687 +[2026-01-29T21:28:32.021857Z] Loop 128: Reg: 0.4940, AltReg: 0.7609, CorReg: 0.0936, TopReg: 0.5738, AllReg: 0.7609, BotRReg: 0.7908, OV: 0.3098, AltV: 0.0687, CorV: 0.6716, TopV: 0.2229, BotRV: 0.0059, AllV: 0.0687 +[2026-01-29T21:28:33.226569Z] Loop 129: Reg: 0.4937, AltReg: 0.7609, CorReg: 0.0929, TopReg: 0.5759, AllReg: 0.7609, BotRReg: 0.7907, OV: 0.3101, AltV: 0.0687, CorV: 0.6722, TopV: 0.2207, BotRV: 0.0060, AllV: 0.0687 +[2026-01-29T21:28:34.430251Z] Loop 130: Reg: 0.4934, AltReg: 0.7609, CorReg: 0.0923, TopReg: 0.5784, AllReg: 0.7609, BotRReg: 0.7905, OV: 0.3103, AltV: 0.0687, CorV: 0.6728, TopV: 0.2183, BotRV: 0.0062, AllV: 0.0687 +[2026-01-29T21:28:35.633690Z] Loop 131: Reg: 0.4932, AltReg: 0.7608, CorReg: 0.0917, TopReg: 0.5815, AllReg: 0.7608, BotRReg: 0.7903, OV: 0.3106, AltV: 0.0687, CorV: 0.6734, TopV: 0.2152, BotRV: 0.0064, AllV: 0.0687 +[2026-01-29T21:28:36.836239Z] Loop 132: Reg: 0.4931, AltReg: 0.7608, CorReg: 0.0915, TopReg: 0.5837, AllReg: 0.7608, BotRReg: 0.7902, OV: 0.3107, AltV: 0.0687, CorV: 0.6736, TopV: 0.2130, BotRV: 0.0065, AllV: 0.0687 +[2026-01-29T21:28:38.041539Z] Loop 133: Reg: 0.4931, AltReg: 0.7608, CorReg: 0.0914, TopReg: 0.5864, AllReg: 0.7608, BotRReg: 0.7900, OV: 0.3107, AltV: 0.0687, CorV: 0.6738, TopV: 0.2103, BotRV: 0.0067, AllV: 0.0687 +[2026-01-29T21:28:39.245440Z] Loop 134: Reg: 0.4931, AltReg: 0.7609, CorReg: 0.0914, TopReg: 0.5893, AllReg: 0.7609, BotRReg: 0.7898, OV: 0.3107, AltV: 0.0687, CorV: 0.6737, TopV: 0.2074, BotRV: 0.0069, AllV: 0.0687 +[2026-01-29T21:28:40.451076Z] Loop 135: Reg: 0.4932, AltReg: 0.7609, CorReg: 0.0916, TopReg: 0.5914, AllReg: 0.7609, BotRReg: 0.7896, OV: 0.3106, AltV: 0.0687, CorV: 0.6735, TopV: 0.2053, BotRV: 0.0071, AllV: 0.0687 +[2026-01-29T21:28:41.655174Z] Loop 136: Reg: 0.4933, AltReg: 0.7609, CorReg: 0.0919, TopReg: 0.5936, AllReg: 0.7609, BotRReg: 0.7895, OV: 0.3105, AltV: 0.0687, CorV: 0.6732, TopV: 0.2031, BotRV: 0.0072, AllV: 0.0687 +[2026-01-29T21:28:42.861642Z] Loop 137: Reg: 0.4934, AltReg: 0.7609, CorReg: 0.0922, TopReg: 0.5949, AllReg: 0.7609, BotRReg: 0.7894, OV: 0.3104, AltV: 0.0686, CorV: 0.6730, TopV: 0.2018, BotRV: 0.0073, AllV: 0.0686 +[2026-01-29T21:28:44.067094Z] Loop 138: Reg: 0.4935, AltReg: 0.7609, CorReg: 0.0924, TopReg: 0.5959, AllReg: 0.7609, BotRReg: 0.7893, OV: 0.3103, AltV: 0.0686, CorV: 0.6727, TopV: 0.2008, BotRV: 0.0074, AllV: 0.0686 +[2026-01-29T21:28:45.271796Z] Loop 139: Reg: 0.4936, AltReg: 0.7609, CorReg: 0.0925, TopReg: 0.5966, AllReg: 0.7609, BotRReg: 0.7893, OV: 0.3102, AltV: 0.0686, CorV: 0.6726, TopV: 0.2001, BotRV: 0.0074, AllV: 0.0686 +[2026-01-29T21:28:46.477226Z] Loop 140: Reg: 0.4935, AltReg: 0.7609, CorReg: 0.0923, TopReg: 0.5956, AllReg: 0.7609, BotRReg: 0.7893, OV: 0.3103, AltV: 0.0686, CorV: 0.6728, TopV: 0.2011, BotRV: 0.0074, AllV: 0.0686 +[2026-01-29T21:28:47.681515Z] Loop 141: Reg: 0.4933, AltReg: 0.7609, CorReg: 0.0919, TopReg: 0.5935, AllReg: 0.7609, BotRReg: 0.7895, OV: 0.3105, AltV: 0.0687, CorV: 0.6733, TopV: 0.2032, BotRV: 0.0072, AllV: 0.0687 +[2026-01-29T21:28:48.887352Z] Loop 142: Reg: 0.4931, AltReg: 0.7609, CorReg: 0.0915, TopReg: 0.5909, AllReg: 0.7609, BotRReg: 0.7897, OV: 0.3107, AltV: 0.0687, CorV: 0.6736, TopV: 0.2058, BotRV: 0.0070, AllV: 0.0687 +[2026-01-29T21:28:50.092481Z] Loop 143: Reg: 0.4930, AltReg: 0.7609, CorReg: 0.0913, TopReg: 0.5878, AllReg: 0.7609, BotRReg: 0.7899, OV: 0.3107, AltV: 0.0687, CorV: 0.6738, TopV: 0.2089, BotRV: 0.0068, AllV: 0.0687 +[2026-01-29T21:28:51.299271Z] Loop 144: Reg: 0.4930, AltReg: 0.7609, CorReg: 0.0913, TopReg: 0.5843, AllReg: 0.7609, BotRReg: 0.7901, OV: 0.3107, AltV: 0.0687, CorV: 0.6738, TopV: 0.2123, BotRV: 0.0066, AllV: 0.0687 +[2026-01-29T21:28:52.505304Z] Loop 145: Reg: 0.4931, AltReg: 0.7609, CorReg: 0.0915, TopReg: 0.5823, AllReg: 0.7609, BotRReg: 0.7903, OV: 0.3107, AltV: 0.0687, CorV: 0.6736, TopV: 0.2144, BotRV: 0.0064, AllV: 0.0687 +[2026-01-29T21:28:53.710311Z] Loop 146: Reg: 0.4932, AltReg: 0.7609, CorReg: 0.0916, TopReg: 0.5810, AllReg: 0.7609, BotRReg: 0.7904, OV: 0.3106, AltV: 0.0687, CorV: 0.6735, TopV: 0.2157, BotRV: 0.0063, AllV: 0.0687 +[2026-01-29T21:28:54.925084Z] Loop 147: Reg: 0.4932, AltReg: 0.7609, CorReg: 0.0918, TopReg: 0.5802, AllReg: 0.7609, BotRReg: 0.7904, OV: 0.3105, AltV: 0.0687, CorV: 0.6734, TopV: 0.2164, BotRV: 0.0063, AllV: 0.0687 +[2026-01-29T21:28:56.128278Z] Loop 148: Reg: 0.4932, AltReg: 0.7609, CorReg: 0.0917, TopReg: 0.5804, AllReg: 0.7609, BotRReg: 0.7904, OV: 0.3106, AltV: 0.0687, CorV: 0.6734, TopV: 0.2163, BotRV: 0.0063, AllV: 0.0687 +[2026-01-29T21:28:57.332346Z] Loop 149: Reg: 0.4931, AltReg: 0.7609, CorReg: 0.0915, TopReg: 0.5816, AllReg: 0.7609, BotRReg: 0.7903, OV: 0.3106, AltV: 0.0687, CorV: 0.6736, TopV: 0.2151, BotRV: 0.0064, AllV: 0.0687 +[2026-01-29T21:28:58.540275Z] Loop 150: Reg: 0.4931, AltReg: 0.7609, CorReg: 0.0915, TopReg: 0.5819, AllReg: 0.7609, BotRReg: 0.7903, OV: 0.3107, AltV: 0.0687, CorV: 0.6736, TopV: 0.2148, BotRV: 0.0064, AllV: 0.0687 +[2026-01-29T21:28:59.745408Z] Loop 151: Reg: 0.4931, AltReg: 0.7609, CorReg: 0.0914, TopReg: 0.5818, AllReg: 0.7609, BotRReg: 0.7903, OV: 0.3107, AltV: 0.0687, CorV: 0.6737, TopV: 0.2149, BotRV: 0.0064, AllV: 0.0687 +[2026-01-29T21:29:00.948754Z] Loop 152: Reg: 0.4931, AltReg: 0.7609, CorReg: 0.0914, TopReg: 0.5821, AllReg: 0.7609, BotRReg: 0.7903, OV: 0.3107, AltV: 0.0687, CorV: 0.6737, TopV: 0.2145, BotRV: 0.0064, AllV: 0.0687 +[2026-01-29T21:29:02.155495Z] Loop 153: Reg: 0.4931, AltReg: 0.7609, CorReg: 0.0914, TopReg: 0.5825, AllReg: 0.7609, BotRReg: 0.7903, OV: 0.3107, AltV: 0.0687, CorV: 0.6738, TopV: 0.2142, BotRV: 0.0064, AllV: 0.0687 +[2026-01-29T21:29:03.364116Z] Loop 154: Reg: 0.4930, AltReg: 0.7609, CorReg: 0.0913, TopReg: 0.5836, AllReg: 0.7609, BotRReg: 0.7902, OV: 0.3107, AltV: 0.0687, CorV: 0.6739, TopV: 0.2131, BotRV: 0.0065, AllV: 0.0687 +[2026-01-29T21:29:04.564651Z] Loop 155: Reg: 0.4930, AltReg: 0.7609, CorReg: 0.0912, TopReg: 0.5844, AllReg: 0.7609, BotRReg: 0.7901, OV: 0.3108, AltV: 0.0687, CorV: 0.6739, TopV: 0.2123, BotRV: 0.0065, AllV: 0.0687 +[2026-01-29T21:29:05.765453Z] Loop 156: Reg: 0.4930, AltReg: 0.7609, CorReg: 0.0911, TopReg: 0.5854, AllReg: 0.7609, BotRReg: 0.7901, OV: 0.3108, AltV: 0.0686, CorV: 0.6740, TopV: 0.2113, BotRV: 0.0066, AllV: 0.0686 +[2026-01-29T21:29:06.965827Z] Loop 157: Reg: 0.4930, AltReg: 0.7609, CorReg: 0.0911, TopReg: 0.5871, AllReg: 0.7609, BotRReg: 0.7900, OV: 0.3108, AltV: 0.0686, CorV: 0.6740, TopV: 0.2096, BotRV: 0.0067, AllV: 0.0686 +[2026-01-29T21:29:08.167799Z] Loop 158: Reg: 0.4930, AltReg: 0.7609, CorReg: 0.0911, TopReg: 0.5884, AllReg: 0.7609, BotRReg: 0.7899, OV: 0.3108, AltV: 0.0686, CorV: 0.6740, TopV: 0.2083, BotRV: 0.0068, AllV: 0.0686 +[2026-01-29T21:29:09.367244Z] Loop 159: Reg: 0.4930, AltReg: 0.7609, CorReg: 0.0912, TopReg: 0.5900, AllReg: 0.7609, BotRReg: 0.7898, OV: 0.3108, AltV: 0.0686, CorV: 0.6740, TopV: 0.2067, BotRV: 0.0069, AllV: 0.0686 +[2026-01-29T21:29:10.567151Z] Loop 160: Reg: 0.4931, AltReg: 0.7609, CorReg: 0.0914, TopReg: 0.5922, AllReg: 0.7609, BotRReg: 0.7896, OV: 0.3107, AltV: 0.0686, CorV: 0.6737, TopV: 0.2044, BotRV: 0.0071, AllV: 0.0686 +[2026-01-29T21:29:11.769627Z] Loop 161: Reg: 0.4933, AltReg: 0.7610, CorReg: 0.0917, TopReg: 0.5945, AllReg: 0.7610, BotRReg: 0.7894, OV: 0.3105, AltV: 0.0686, CorV: 0.6734, TopV: 0.2022, BotRV: 0.0073, AllV: 0.0686 +[2026-01-29T21:29:12.972220Z] Loop 162: Reg: 0.4935, AltReg: 0.7610, CorReg: 0.0922, TopReg: 0.5968, AllReg: 0.7610, BotRReg: 0.7893, OV: 0.3103, AltV: 0.0686, CorV: 0.6729, TopV: 0.1999, BotRV: 0.0074, AllV: 0.0686 +[2026-01-29T21:29:14.175026Z] Loop 163: Reg: 0.4937, AltReg: 0.7610, CorReg: 0.0926, TopReg: 0.5983, AllReg: 0.7610, BotRReg: 0.7892, OV: 0.3101, AltV: 0.0685, CorV: 0.6725, TopV: 0.1983, BotRV: 0.0075, AllV: 0.0685 +[2026-01-29T21:29:15.380421Z] Loop 164: Reg: 0.4937, AltReg: 0.7610, CorReg: 0.0928, TopReg: 0.5989, AllReg: 0.7610, BotRReg: 0.7891, OV: 0.3101, AltV: 0.0685, CorV: 0.6724, TopV: 0.1978, BotRV: 0.0076, AllV: 0.0685 +[2026-01-29T21:29:16.584647Z] Loop 165: Reg: 0.4937, AltReg: 0.7610, CorReg: 0.0926, TopReg: 0.5986, AllReg: 0.7610, BotRReg: 0.7891, OV: 0.3101, AltV: 0.0685, CorV: 0.6725, TopV: 0.1981, BotRV: 0.0076, AllV: 0.0685 +[2026-01-29T21:29:17.789763Z] Loop 166: Reg: 0.4934, AltReg: 0.7610, CorReg: 0.0919, TopReg: 0.5958, AllReg: 0.7610, BotRReg: 0.7893, OV: 0.3104, AltV: 0.0685, CorV: 0.6732, TopV: 0.2008, BotRV: 0.0073, AllV: 0.0685 +[2026-01-29T21:29:18.999076Z] Loop 167: Reg: 0.4931, AltReg: 0.7610, CorReg: 0.0913, TopReg: 0.5932, AllReg: 0.7610, BotRReg: 0.7895, OV: 0.3106, AltV: 0.0686, CorV: 0.6738, TopV: 0.2035, BotRV: 0.0071, AllV: 0.0686 +[2026-01-29T21:29:20.204367Z] Loop 168: Reg: 0.4929, AltReg: 0.7610, CorReg: 0.0909, TopReg: 0.5891, AllReg: 0.7610, BotRReg: 0.7898, OV: 0.3108, AltV: 0.0686, CorV: 0.6743, TopV: 0.2076, BotRV: 0.0068, AllV: 0.0686 +[2026-01-29T21:29:21.408677Z] Loop 169: Reg: 0.4929, AltReg: 0.7610, CorReg: 0.0908, TopReg: 0.5851, AllReg: 0.7610, BotRReg: 0.7901, OV: 0.3109, AltV: 0.0686, CorV: 0.6743, TopV: 0.2116, BotRV: 0.0066, AllV: 0.0686 +[2026-01-29T21:29:22.614308Z] Loop 170: Reg: 0.4931, AltReg: 0.7610, CorReg: 0.0912, TopReg: 0.5810, AllReg: 0.7610, BotRReg: 0.7904, OV: 0.3107, AltV: 0.0686, CorV: 0.6739, TopV: 0.2157, BotRV: 0.0063, AllV: 0.0686 +[2026-01-29T21:29:23.820352Z] Loop 171: Reg: 0.4933, AltReg: 0.7610, CorReg: 0.0917, TopReg: 0.5782, AllReg: 0.7610, BotRReg: 0.7906, OV: 0.3105, AltV: 0.0685, CorV: 0.6734, TopV: 0.2184, BotRV: 0.0061, AllV: 0.0685 +[2026-01-29T21:29:25.024004Z] Loop 172: Reg: 0.4935, AltReg: 0.7610, CorReg: 0.0922, TopReg: 0.5763, AllReg: 0.7610, BotRReg: 0.7907, OV: 0.3103, AltV: 0.0685, CorV: 0.6730, TopV: 0.2204, BotRV: 0.0060, AllV: 0.0685 +[2026-01-29T21:29:26.228058Z] Loop 173: Reg: 0.4936, AltReg: 0.7610, CorReg: 0.0925, TopReg: 0.5753, AllReg: 0.7610, BotRReg: 0.7908, OV: 0.3102, AltV: 0.0685, CorV: 0.6727, TopV: 0.2214, BotRV: 0.0059, AllV: 0.0685 +[2026-01-29T21:29:27.432898Z] Loop 174: Reg: 0.4937, AltReg: 0.7610, CorReg: 0.0927, TopReg: 0.5744, AllReg: 0.7610, BotRReg: 0.7908, OV: 0.3101, AltV: 0.0685, CorV: 0.6724, TopV: 0.2223, BotRV: 0.0059, AllV: 0.0685 +[2026-01-29T21:29:28.637177Z] Loop 175: Reg: 0.4937, AltReg: 0.7610, CorReg: 0.0927, TopReg: 0.5743, AllReg: 0.7610, BotRReg: 0.7908, OV: 0.3101, AltV: 0.0685, CorV: 0.6724, TopV: 0.2224, BotRV: 0.0059, AllV: 0.0685 +[2026-01-29T21:29:29.841338Z] Loop 176: Reg: 0.4937, AltReg: 0.7610, CorReg: 0.0927, TopReg: 0.5744, AllReg: 0.7610, BotRReg: 0.7908, OV: 0.3101, AltV: 0.0685, CorV: 0.6724, TopV: 0.2223, BotRV: 0.0059, AllV: 0.0685 +[2026-01-29T21:29:31.045406Z] Loop 177: Reg: 0.4935, AltReg: 0.7610, CorReg: 0.0922, TopReg: 0.5758, AllReg: 0.7610, BotRReg: 0.7907, OV: 0.3103, AltV: 0.0685, CorV: 0.6729, TopV: 0.2209, BotRV: 0.0060, AllV: 0.0685 +[2026-01-29T21:29:32.248062Z] Loop 178: Reg: 0.4933, AltReg: 0.7610, CorReg: 0.0918, TopReg: 0.5774, AllReg: 0.7610, BotRReg: 0.7906, OV: 0.3104, AltV: 0.0685, CorV: 0.6733, TopV: 0.2193, BotRV: 0.0061, AllV: 0.0685 +[2026-01-29T21:29:33.450575Z] Loop 179: Reg: 0.4932, AltReg: 0.7610, CorReg: 0.0914, TopReg: 0.5791, AllReg: 0.7610, BotRReg: 0.7905, OV: 0.3106, AltV: 0.0685, CorV: 0.6737, TopV: 0.2176, BotRV: 0.0062, AllV: 0.0685 +[2026-01-29T21:29:34.657536Z] Loop 180: Reg: 0.4930, AltReg: 0.7610, CorReg: 0.0911, TopReg: 0.5811, AllReg: 0.7610, BotRReg: 0.7904, OV: 0.3107, AltV: 0.0685, CorV: 0.6740, TopV: 0.2156, BotRV: 0.0063, AllV: 0.0685 +[2026-01-29T21:29:35.861951Z] Loop 181: Reg: 0.4930, AltReg: 0.7610, CorReg: 0.0909, TopReg: 0.5828, AllReg: 0.7610, BotRReg: 0.7903, OV: 0.3108, AltV: 0.0685, CorV: 0.6742, TopV: 0.2139, BotRV: 0.0064, AllV: 0.0685 +[2026-01-29T21:29:37.066621Z] Loop 182: Reg: 0.4929, AltReg: 0.7610, CorReg: 0.0907, TopReg: 0.5853, AllReg: 0.7610, BotRReg: 0.7901, OV: 0.3109, AltV: 0.0685, CorV: 0.6744, TopV: 0.2113, BotRV: 0.0066, AllV: 0.0685 +[2026-01-29T21:29:38.270583Z] Loop 183: Reg: 0.4929, AltReg: 0.7610, CorReg: 0.0906, TopReg: 0.5878, AllReg: 0.7610, BotRReg: 0.7899, OV: 0.3109, AltV: 0.0685, CorV: 0.6745, TopV: 0.2089, BotRV: 0.0067, AllV: 0.0685 +[2026-01-29T21:29:39.478364Z] Loop 184: Reg: 0.4929, AltReg: 0.7610, CorReg: 0.0908, TopReg: 0.5905, AllReg: 0.7610, BotRReg: 0.7897, OV: 0.3108, AltV: 0.0685, CorV: 0.6743, TopV: 0.2062, BotRV: 0.0069, AllV: 0.0685 +[2026-01-29T21:29:40.683519Z] Loop 185: Reg: 0.4931, AltReg: 0.7610, CorReg: 0.0911, TopReg: 0.5934, AllReg: 0.7610, BotRReg: 0.7895, OV: 0.3107, AltV: 0.0685, CorV: 0.6740, TopV: 0.2033, BotRV: 0.0071, AllV: 0.0685 +[2026-01-29T21:29:41.887610Z] Loop 186: Reg: 0.4933, AltReg: 0.7611, CorReg: 0.0916, TopReg: 0.5956, AllReg: 0.7611, BotRReg: 0.7894, OV: 0.3105, AltV: 0.0685, CorV: 0.6735, TopV: 0.2010, BotRV: 0.0073, AllV: 0.0685 +[2026-01-29T21:29:43.092069Z] Loop 187: Reg: 0.4933, AltReg: 0.7611, CorReg: 0.0917, TopReg: 0.5964, AllReg: 0.7611, BotRReg: 0.7893, OV: 0.3104, AltV: 0.0685, CorV: 0.6734, TopV: 0.2003, BotRV: 0.0074, AllV: 0.0685 +[2026-01-29T21:29:44.296214Z] Loop 188: Reg: 0.4933, AltReg: 0.7611, CorReg: 0.0917, TopReg: 0.5963, AllReg: 0.7611, BotRReg: 0.7893, OV: 0.3105, AltV: 0.0685, CorV: 0.6734, TopV: 0.2004, BotRV: 0.0074, AllV: 0.0685 +[2026-01-29T21:29:45.501894Z] Loop 189: Reg: 0.4932, AltReg: 0.7611, CorReg: 0.0915, TopReg: 0.5953, AllReg: 0.7611, BotRReg: 0.7894, OV: 0.3106, AltV: 0.0685, CorV: 0.6737, TopV: 0.2013, BotRV: 0.0073, AllV: 0.0685 +[2026-01-29T21:29:46.705829Z] Loop 190: Reg: 0.4931, AltReg: 0.7611, CorReg: 0.0912, TopReg: 0.5940, AllReg: 0.7611, BotRReg: 0.7895, OV: 0.3107, AltV: 0.0685, CorV: 0.6739, TopV: 0.2027, BotRV: 0.0072, AllV: 0.0685 +[2026-01-29T21:29:47.910811Z] Loop 191: Reg: 0.4931, AltReg: 0.7611, CorReg: 0.0911, TopReg: 0.5932, AllReg: 0.7611, BotRReg: 0.7896, OV: 0.3107, AltV: 0.0685, CorV: 0.6740, TopV: 0.2034, BotRV: 0.0071, AllV: 0.0685 +[2026-01-29T21:29:49.114652Z] Loop 192: Reg: 0.4929, AltReg: 0.7610, CorReg: 0.0907, TopReg: 0.5909, AllReg: 0.7610, BotRReg: 0.7897, OV: 0.3109, AltV: 0.0685, CorV: 0.6744, TopV: 0.2058, BotRV: 0.0070, AllV: 0.0685 +[2026-01-29T21:29:50.319543Z] Loop 193: Reg: 0.4928, AltReg: 0.7610, CorReg: 0.0905, TopReg: 0.5874, AllReg: 0.7610, BotRReg: 0.7900, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2093, BotRV: 0.0067, AllV: 0.0685 +[2026-01-29T21:29:51.532472Z] Loop 194: Reg: 0.4929, AltReg: 0.7610, CorReg: 0.0907, TopReg: 0.5833, AllReg: 0.7610, BotRReg: 0.7903, OV: 0.3109, AltV: 0.0685, CorV: 0.6745, TopV: 0.2134, BotRV: 0.0064, AllV: 0.0685 +[2026-01-29T21:29:52.738254Z] Loop 195: Reg: 0.4931, AltReg: 0.7611, CorReg: 0.0911, TopReg: 0.5796, AllReg: 0.7611, BotRReg: 0.7905, OV: 0.3107, AltV: 0.0685, CorV: 0.6740, TopV: 0.2171, BotRV: 0.0062, AllV: 0.0685 +[2026-01-29T21:29:53.941222Z] Loop 196: Reg: 0.4932, AltReg: 0.7611, CorReg: 0.0915, TopReg: 0.5779, AllReg: 0.7611, BotRReg: 0.7906, OV: 0.3105, AltV: 0.0685, CorV: 0.6736, TopV: 0.2188, BotRV: 0.0061, AllV: 0.0685 +[2026-01-29T21:29:55.145319Z] Loop 197: Reg: 0.4932, AltReg: 0.7611, CorReg: 0.0915, TopReg: 0.5778, AllReg: 0.7611, BotRReg: 0.7906, OV: 0.3105, AltV: 0.0685, CorV: 0.6736, TopV: 0.2189, BotRV: 0.0061, AllV: 0.0685 +[2026-01-29T21:29:56.348979Z] Loop 198: Reg: 0.4932, AltReg: 0.7611, CorReg: 0.0913, TopReg: 0.5786, AllReg: 0.7611, BotRReg: 0.7906, OV: 0.3106, AltV: 0.0685, CorV: 0.6738, TopV: 0.2181, BotRV: 0.0061, AllV: 0.0685 +[2026-01-29T21:29:57.556455Z] Loop 199: Reg: 0.4931, AltReg: 0.7611, CorReg: 0.0911, TopReg: 0.5800, AllReg: 0.7611, BotRReg: 0.7905, OV: 0.3107, AltV: 0.0685, CorV: 0.6741, TopV: 0.2167, BotRV: 0.0062, AllV: 0.0685 +[2026-01-29T21:29:58.759737Z] Loop 200: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0908, TopReg: 0.5818, AllReg: 0.7611, BotRReg: 0.7904, OV: 0.3108, AltV: 0.0685, CorV: 0.6743, TopV: 0.2149, BotRV: 0.0063, AllV: 0.0685 +[2026-01-29T21:29:59.962941Z] Loop 201: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0906, TopReg: 0.5837, AllReg: 0.7611, BotRReg: 0.7902, OV: 0.3109, AltV: 0.0685, CorV: 0.6745, TopV: 0.2130, BotRV: 0.0065, AllV: 0.0685 +[2026-01-29T21:30:01.166017Z] Loop 202: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5862, AllReg: 0.7611, BotRReg: 0.7901, OV: 0.3110, AltV: 0.0685, CorV: 0.6747, TopV: 0.2105, BotRV: 0.0066, AllV: 0.0685 +[2026-01-29T21:30:02.369430Z] Loop 203: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5882, AllReg: 0.7611, BotRReg: 0.7899, OV: 0.3110, AltV: 0.0685, CorV: 0.6746, TopV: 0.2085, BotRV: 0.0068, AllV: 0.0685 +[2026-01-29T21:30:03.572463Z] Loop 204: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0906, TopReg: 0.5897, AllReg: 0.7611, BotRReg: 0.7898, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2070, BotRV: 0.0069, AllV: 0.0685 +[2026-01-29T21:30:04.775509Z] Loop 205: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0906, TopReg: 0.5907, AllReg: 0.7611, BotRReg: 0.7897, OV: 0.3109, AltV: 0.0685, CorV: 0.6745, TopV: 0.2060, BotRV: 0.0069, AllV: 0.0685 +[2026-01-29T21:30:05.979216Z] Loop 206: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0908, TopReg: 0.5922, AllReg: 0.7611, BotRReg: 0.7896, OV: 0.3108, AltV: 0.0685, CorV: 0.6743, TopV: 0.2045, BotRV: 0.0070, AllV: 0.0685 +[2026-01-29T21:30:07.184150Z] Loop 207: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0910, TopReg: 0.5935, AllReg: 0.7611, BotRReg: 0.7895, OV: 0.3107, AltV: 0.0685, CorV: 0.6741, TopV: 0.2032, BotRV: 0.0071, AllV: 0.0685 +[2026-01-29T21:30:08.387075Z] Loop 208: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0909, TopReg: 0.5930, AllReg: 0.7611, BotRReg: 0.7896, OV: 0.3108, AltV: 0.0685, CorV: 0.6742, TopV: 0.2036, BotRV: 0.0071, AllV: 0.0685 +[2026-01-29T21:30:09.591417Z] Loop 209: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0908, TopReg: 0.5920, AllReg: 0.7611, BotRReg: 0.7897, OV: 0.3108, AltV: 0.0685, CorV: 0.6744, TopV: 0.2047, BotRV: 0.0070, AllV: 0.0685 +[2026-01-29T21:30:10.794443Z] Loop 210: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0906, TopReg: 0.5910, AllReg: 0.7611, BotRReg: 0.7897, OV: 0.3109, AltV: 0.0685, CorV: 0.6745, TopV: 0.2056, BotRV: 0.0070, AllV: 0.0685 +[2026-01-29T21:30:11.996686Z] Loop 211: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5898, AllReg: 0.7611, BotRReg: 0.7898, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2069, BotRV: 0.0069, AllV: 0.0685 +[2026-01-29T21:30:13.204466Z] Loop 212: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0904, TopReg: 0.5879, AllReg: 0.7611, BotRReg: 0.7899, OV: 0.3110, AltV: 0.0685, CorV: 0.6747, TopV: 0.2088, BotRV: 0.0067, AllV: 0.0685 +[2026-01-29T21:30:14.409346Z] Loop 213: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0904, TopReg: 0.5856, AllReg: 0.7611, BotRReg: 0.7901, OV: 0.3110, AltV: 0.0685, CorV: 0.6747, TopV: 0.2111, BotRV: 0.0066, AllV: 0.0685 +[2026-01-29T21:30:15.611090Z] Loop 214: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5838, AllReg: 0.7611, BotRReg: 0.7902, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2129, BotRV: 0.0065, AllV: 0.0685 +[2026-01-29T21:30:16.813680Z] Loop 215: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0906, TopReg: 0.5829, AllReg: 0.7611, BotRReg: 0.7903, OV: 0.3109, AltV: 0.0685, CorV: 0.6745, TopV: 0.2138, BotRV: 0.0064, AllV: 0.0685 +[2026-01-29T21:30:18.015177Z] Loop 216: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0907, TopReg: 0.5823, AllReg: 0.7611, BotRReg: 0.7903, OV: 0.3109, AltV: 0.0685, CorV: 0.6744, TopV: 0.2144, BotRV: 0.0064, AllV: 0.0685 +[2026-01-29T21:30:19.216779Z] Loop 217: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0909, TopReg: 0.5808, AllReg: 0.7611, BotRReg: 0.7904, OV: 0.3108, AltV: 0.0685, CorV: 0.6742, TopV: 0.2159, BotRV: 0.0063, AllV: 0.0685 +[2026-01-29T21:30:20.416712Z] Loop 218: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0909, TopReg: 0.5809, AllReg: 0.7611, BotRReg: 0.7904, OV: 0.3108, AltV: 0.0685, CorV: 0.6742, TopV: 0.2158, BotRV: 0.0063, AllV: 0.0685 +[2026-01-29T21:30:21.618896Z] Loop 219: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0909, TopReg: 0.5809, AllReg: 0.7611, BotRReg: 0.7904, OV: 0.3108, AltV: 0.0685, CorV: 0.6743, TopV: 0.2158, BotRV: 0.0063, AllV: 0.0685 +[2026-01-29T21:30:22.820701Z] Loop 220: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0908, TopReg: 0.5817, AllReg: 0.7611, BotRReg: 0.7904, OV: 0.3108, AltV: 0.0685, CorV: 0.6744, TopV: 0.2150, BotRV: 0.0063, AllV: 0.0685 +[2026-01-29T21:30:24.022241Z] Loop 221: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0906, TopReg: 0.5831, AllReg: 0.7611, BotRReg: 0.7903, OV: 0.3109, AltV: 0.0685, CorV: 0.6745, TopV: 0.2136, BotRV: 0.0064, AllV: 0.0685 +[2026-01-29T21:30:25.224034Z] Loop 222: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5838, AllReg: 0.7611, BotRReg: 0.7902, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2128, BotRV: 0.0065, AllV: 0.0685 +[2026-01-29T21:30:26.428177Z] Loop 223: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5845, AllReg: 0.7611, BotRReg: 0.7902, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2122, BotRV: 0.0065, AllV: 0.0685 +[2026-01-29T21:30:27.630813Z] Loop 224: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5845, AllReg: 0.7611, BotRReg: 0.7902, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2122, BotRV: 0.0065, AllV: 0.0685 +[2026-01-29T21:30:28.834911Z] Loop 225: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5843, AllReg: 0.7611, BotRReg: 0.7902, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2124, BotRV: 0.0065, AllV: 0.0685 +[2026-01-29T21:30:30.038734Z] Loop 226: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5842, AllReg: 0.7611, BotRReg: 0.7902, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2125, BotRV: 0.0065, AllV: 0.0685 +[2026-01-29T21:30:31.249058Z] Loop 227: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5849, AllReg: 0.7611, BotRReg: 0.7902, OV: 0.3110, AltV: 0.0685, CorV: 0.6746, TopV: 0.2118, BotRV: 0.0065, AllV: 0.0685 +[2026-01-29T21:30:32.452774Z] Loop 228: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0904, TopReg: 0.5856, AllReg: 0.7611, BotRReg: 0.7901, OV: 0.3110, AltV: 0.0685, CorV: 0.6747, TopV: 0.2111, BotRV: 0.0066, AllV: 0.0685 +[2026-01-29T21:30:33.657689Z] Loop 229: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0904, TopReg: 0.5865, AllReg: 0.7611, BotRReg: 0.7900, OV: 0.3110, AltV: 0.0685, CorV: 0.6747, TopV: 0.2102, BotRV: 0.0066, AllV: 0.0685 +[2026-01-29T21:30:34.862210Z] Loop 230: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0904, TopReg: 0.5870, AllReg: 0.7611, BotRReg: 0.7900, OV: 0.3110, AltV: 0.0685, CorV: 0.6747, TopV: 0.2097, BotRV: 0.0067, AllV: 0.0685 +[2026-01-29T21:30:36.067224Z] Loop 231: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5887, AllReg: 0.7611, BotRReg: 0.7899, OV: 0.3110, AltV: 0.0685, CorV: 0.6746, TopV: 0.2080, BotRV: 0.0068, AllV: 0.0685 +[2026-01-29T21:30:37.272473Z] Loop 232: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5892, AllReg: 0.7611, BotRReg: 0.7899, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2075, BotRV: 0.0068, AllV: 0.0685 +[2026-01-29T21:30:38.477866Z] Loop 233: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5894, AllReg: 0.7611, BotRReg: 0.7898, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2073, BotRV: 0.0068, AllV: 0.0685 +[2026-01-29T21:30:39.682929Z] Loop 234: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0906, TopReg: 0.5904, AllReg: 0.7611, BotRReg: 0.7898, OV: 0.3109, AltV: 0.0685, CorV: 0.6745, TopV: 0.2063, BotRV: 0.0069, AllV: 0.0685 +[2026-01-29T21:30:40.888785Z] Loop 235: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0907, TopReg: 0.5912, AllReg: 0.7611, BotRReg: 0.7897, OV: 0.3109, AltV: 0.0685, CorV: 0.6745, TopV: 0.2055, BotRV: 0.0070, AllV: 0.0685 +[2026-01-29T21:30:42.092181Z] Loop 236: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0907, TopReg: 0.5917, AllReg: 0.7611, BotRReg: 0.7897, OV: 0.3108, AltV: 0.0685, CorV: 0.6744, TopV: 0.2050, BotRV: 0.0070, AllV: 0.0685 +[2026-01-29T21:30:43.296314Z] Loop 237: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0907, TopReg: 0.5918, AllReg: 0.7611, BotRReg: 0.7897, OV: 0.3108, AltV: 0.0685, CorV: 0.6744, TopV: 0.2049, BotRV: 0.0070, AllV: 0.0685 +[2026-01-29T21:30:44.500265Z] Loop 238: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0907, TopReg: 0.5922, AllReg: 0.7611, BotRReg: 0.7896, OV: 0.3108, AltV: 0.0685, CorV: 0.6744, TopV: 0.2045, BotRV: 0.0070, AllV: 0.0685 +[2026-01-29T21:30:45.713480Z] Loop 239: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0908, TopReg: 0.5928, AllReg: 0.7611, BotRReg: 0.7896, OV: 0.3108, AltV: 0.0685, CorV: 0.6743, TopV: 0.2039, BotRV: 0.0071, AllV: 0.0685 +[2026-01-29T21:30:46.917140Z] Loop 240: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0908, TopReg: 0.5925, AllReg: 0.7611, BotRReg: 0.7896, OV: 0.3108, AltV: 0.0685, CorV: 0.6744, TopV: 0.2042, BotRV: 0.0071, AllV: 0.0685 +[2026-01-29T21:30:48.124565Z] Loop 241: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0906, TopReg: 0.5917, AllReg: 0.7611, BotRReg: 0.7897, OV: 0.3109, AltV: 0.0685, CorV: 0.6745, TopV: 0.2050, BotRV: 0.0070, AllV: 0.0685 +[2026-01-29T21:30:49.331450Z] Loop 242: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5902, AllReg: 0.7611, BotRReg: 0.7898, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2065, BotRV: 0.0069, AllV: 0.0685 +[2026-01-29T21:30:50.534646Z] Loop 243: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0903, TopReg: 0.5879, AllReg: 0.7611, BotRReg: 0.7900, OV: 0.3110, AltV: 0.0685, CorV: 0.6748, TopV: 0.2088, BotRV: 0.0067, AllV: 0.0685 +[2026-01-29T21:30:51.738034Z] Loop 244: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0903, TopReg: 0.5854, AllReg: 0.7611, BotRReg: 0.7901, OV: 0.3110, AltV: 0.0685, CorV: 0.6748, TopV: 0.2113, BotRV: 0.0066, AllV: 0.0685 +[2026-01-29T21:30:52.949332Z] Loop 245: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5828, AllReg: 0.7611, BotRReg: 0.7903, OV: 0.3109, AltV: 0.0685, CorV: 0.6746, TopV: 0.2138, BotRV: 0.0064, AllV: 0.0685 +[2026-01-29T21:30:54.164768Z] Loop 246: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0908, TopReg: 0.5803, AllReg: 0.7611, BotRReg: 0.7905, OV: 0.3108, AltV: 0.0685, CorV: 0.6743, TopV: 0.2164, BotRV: 0.0062, AllV: 0.0685 +[2026-01-29T21:30:55.377873Z] Loop 247: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0909, TopReg: 0.5797, AllReg: 0.7611, BotRReg: 0.7905, OV: 0.3108, AltV: 0.0684, CorV: 0.6742, TopV: 0.2170, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:30:56.583086Z] Loop 248: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0908, TopReg: 0.5802, AllReg: 0.7611, BotRReg: 0.7905, OV: 0.3108, AltV: 0.0684, CorV: 0.6743, TopV: 0.2165, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:30:57.790331Z] Loop 249: Reg: 0.4930, AltReg: 0.7611, CorReg: 0.0908, TopReg: 0.5803, AllReg: 0.7611, BotRReg: 0.7905, OV: 0.3108, AltV: 0.0684, CorV: 0.6743, TopV: 0.2164, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:30:59.001150Z] Loop 250: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0906, TopReg: 0.5815, AllReg: 0.7611, BotRReg: 0.7904, OV: 0.3109, AltV: 0.0684, CorV: 0.6745, TopV: 0.2152, BotRV: 0.0063, AllV: 0.0684 +[2026-01-29T21:31:01.364853Z] Loop 252: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0902, TopReg: 0.5859, AllReg: 0.7611, BotRReg: 0.7901, OV: 0.3110, AltV: 0.0685, CorV: 0.6749, TopV: 0.2108, BotRV: 0.0066, AllV: 0.0685 +[2026-01-29T21:31:03.742957Z] Loop 254: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0903, TopReg: 0.5905, AllReg: 0.7611, BotRReg: 0.7898, OV: 0.3110, AltV: 0.0684, CorV: 0.6748, TopV: 0.2062, BotRV: 0.0069, AllV: 0.0684 +[2026-01-29T21:31:06.123334Z] Loop 256: Reg: 0.4931, AltReg: 0.7612, CorReg: 0.0909, TopReg: 0.5947, AllReg: 0.7612, BotRReg: 0.7895, OV: 0.3107, AltV: 0.0684, CorV: 0.6742, TopV: 0.2020, BotRV: 0.0072, AllV: 0.0684 +[2026-01-29T21:31:08.495753Z] Loop 258: Reg: 0.4930, AltReg: 0.7612, CorReg: 0.0909, TopReg: 0.5946, AllReg: 0.7612, BotRReg: 0.7895, OV: 0.3107, AltV: 0.0684, CorV: 0.6742, TopV: 0.2020, BotRV: 0.0072, AllV: 0.0684 +[2026-01-29T21:31:10.858091Z] Loop 260: Reg: 0.4929, AltReg: 0.7611, CorReg: 0.0905, TopReg: 0.5923, AllReg: 0.7611, BotRReg: 0.7897, OV: 0.3109, AltV: 0.0684, CorV: 0.6746, TopV: 0.2044, BotRV: 0.0070, AllV: 0.0684 +[2026-01-29T21:31:13.228847Z] Loop 262: Reg: 0.4928, AltReg: 0.7611, CorReg: 0.0902, TopReg: 0.5902, AllReg: 0.7611, BotRReg: 0.7898, OV: 0.3110, AltV: 0.0684, CorV: 0.6749, TopV: 0.2065, BotRV: 0.0069, AllV: 0.0684 +[2026-01-29T21:31:15.593223Z] Loop 264: Reg: 0.4927, AltReg: 0.7611, CorReg: 0.0900, TopReg: 0.5870, AllReg: 0.7611, BotRReg: 0.7900, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2097, BotRV: 0.0067, AllV: 0.0684 +[2026-01-29T21:31:17.962897Z] Loop 266: Reg: 0.4927, AltReg: 0.7611, CorReg: 0.0901, TopReg: 0.5857, AllReg: 0.7611, BotRReg: 0.7901, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2110, BotRV: 0.0066, AllV: 0.0684 +[2026-01-29T21:31:20.330376Z] Loop 268: Reg: 0.4927, AltReg: 0.7611, CorReg: 0.0900, TopReg: 0.5865, AllReg: 0.7611, BotRReg: 0.7901, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2102, BotRV: 0.0066, AllV: 0.0684 +[2026-01-29T21:31:22.691445Z] Loop 270: Reg: 0.4927, AltReg: 0.7611, CorReg: 0.0900, TopReg: 0.5873, AllReg: 0.7611, BotRReg: 0.7900, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2094, BotRV: 0.0067, AllV: 0.0684 +[2026-01-29T21:31:25.052290Z] Loop 272: Reg: 0.4927, AltReg: 0.7611, CorReg: 0.0900, TopReg: 0.5850, AllReg: 0.7611, BotRReg: 0.7902, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2117, BotRV: 0.0065, AllV: 0.0684 +[2026-01-29T21:31:27.414667Z] Loop 274: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0902, TopReg: 0.5825, AllReg: 0.7612, BotRReg: 0.7903, OV: 0.3110, AltV: 0.0684, CorV: 0.6749, TopV: 0.2142, BotRV: 0.0064, AllV: 0.0684 +[2026-01-29T21:31:29.794187Z] Loop 276: Reg: 0.4929, AltReg: 0.7612, CorReg: 0.0905, TopReg: 0.5804, AllReg: 0.7612, BotRReg: 0.7905, OV: 0.3109, AltV: 0.0684, CorV: 0.6746, TopV: 0.2163, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:31:32.165564Z] Loop 278: Reg: 0.4929, AltReg: 0.7612, CorReg: 0.0905, TopReg: 0.5806, AllReg: 0.7612, BotRReg: 0.7905, OV: 0.3109, AltV: 0.0684, CorV: 0.6747, TopV: 0.2161, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:31:34.527928Z] Loop 280: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0901, TopReg: 0.5837, AllReg: 0.7612, BotRReg: 0.7903, OV: 0.3111, AltV: 0.0684, CorV: 0.6750, TopV: 0.2130, BotRV: 0.0064, AllV: 0.0684 +[2026-01-29T21:31:36.894837Z] Loop 282: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5894, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2072, BotRV: 0.0068, AllV: 0.0684 +[2026-01-29T21:31:39.263323Z] Loop 284: Reg: 0.4930, AltReg: 0.7612, CorReg: 0.0906, TopReg: 0.5941, AllReg: 0.7612, BotRReg: 0.7895, OV: 0.3108, AltV: 0.0684, CorV: 0.6745, TopV: 0.2026, BotRV: 0.0072, AllV: 0.0684 +[2026-01-29T21:31:41.627881Z] Loop 286: Reg: 0.4934, AltReg: 0.7612, CorReg: 0.0915, TopReg: 0.5982, AllReg: 0.7612, BotRReg: 0.7892, OV: 0.3104, AltV: 0.0683, CorV: 0.6736, TopV: 0.1985, BotRV: 0.0075, AllV: 0.0683 +[2026-01-29T21:31:43.991022Z] Loop 288: Reg: 0.4931, AltReg: 0.7612, CorReg: 0.0909, TopReg: 0.5955, AllReg: 0.7612, BotRReg: 0.7894, OV: 0.3107, AltV: 0.0684, CorV: 0.6742, TopV: 0.2011, BotRV: 0.0073, AllV: 0.0684 +[2026-01-29T21:31:46.355998Z] Loop 290: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5886, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2081, BotRV: 0.0068, AllV: 0.0684 +[2026-01-29T21:31:48.714629Z] Loop 292: Reg: 0.4929, AltReg: 0.7612, CorReg: 0.0904, TopReg: 0.5811, AllReg: 0.7612, BotRReg: 0.7904, OV: 0.3109, AltV: 0.0684, CorV: 0.6747, TopV: 0.2156, BotRV: 0.0063, AllV: 0.0684 +[2026-01-29T21:31:51.076547Z] Loop 294: Reg: 0.4933, AltReg: 0.7612, CorReg: 0.0915, TopReg: 0.5761, AllReg: 0.7612, BotRReg: 0.7908, OV: 0.3105, AltV: 0.0684, CorV: 0.6737, TopV: 0.2206, BotRV: 0.0059, AllV: 0.0684 +[2026-01-29T21:31:53.438388Z] Loop 296: Reg: 0.4936, AltReg: 0.7612, CorReg: 0.0921, TopReg: 0.5739, AllReg: 0.7612, BotRReg: 0.7909, OV: 0.3102, AltV: 0.0683, CorV: 0.6730, TopV: 0.2228, BotRV: 0.0058, AllV: 0.0683 +[2026-01-29T21:31:55.799584Z] Loop 298: Reg: 0.4932, AltReg: 0.7612, CorReg: 0.0912, TopReg: 0.5772, AllReg: 0.7612, BotRReg: 0.7907, OV: 0.3106, AltV: 0.0684, CorV: 0.6739, TopV: 0.2195, BotRV: 0.0060, AllV: 0.0684 +[2026-01-29T21:31:58.166776Z] Loop 300: Reg: 0.4929, AltReg: 0.7612, CorReg: 0.0905, TopReg: 0.5804, AllReg: 0.7612, BotRReg: 0.7905, OV: 0.3109, AltV: 0.0684, CorV: 0.6746, TopV: 0.2163, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:32:00.537919Z] Loop 302: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5862, AllReg: 0.7612, BotRReg: 0.7901, OV: 0.3111, AltV: 0.0684, CorV: 0.6752, TopV: 0.2105, BotRV: 0.0066, AllV: 0.0684 +[2026-01-29T21:32:02.901699Z] Loop 304: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0902, TopReg: 0.5915, AllReg: 0.7612, BotRReg: 0.7897, OV: 0.3110, AltV: 0.0684, CorV: 0.6749, TopV: 0.2052, BotRV: 0.0070, AllV: 0.0684 +[2026-01-29T21:32:05.269395Z] Loop 306: Reg: 0.4930, AltReg: 0.7612, CorReg: 0.0908, TopReg: 0.5952, AllReg: 0.7612, BotRReg: 0.7895, OV: 0.3107, AltV: 0.0684, CorV: 0.6743, TopV: 0.2015, BotRV: 0.0072, AllV: 0.0684 +[2026-01-29T21:32:07.633372Z] Loop 308: Reg: 0.4932, AltReg: 0.7612, CorReg: 0.0911, TopReg: 0.5967, AllReg: 0.7612, BotRReg: 0.7893, OV: 0.3106, AltV: 0.0683, CorV: 0.6740, TopV: 0.2000, BotRV: 0.0073, AllV: 0.0683 +[2026-01-29T21:32:09.995290Z] Loop 310: Reg: 0.4935, AltReg: 0.7612, CorReg: 0.0918, TopReg: 0.5992, AllReg: 0.7612, BotRReg: 0.7892, OV: 0.3103, AltV: 0.0683, CorV: 0.6733, TopV: 0.1974, BotRV: 0.0075, AllV: 0.0683 +[2026-01-29T21:32:12.359475Z] Loop 312: Reg: 0.4933, AltReg: 0.7612, CorReg: 0.0915, TopReg: 0.5981, AllReg: 0.7612, BotRReg: 0.7892, OV: 0.3104, AltV: 0.0683, CorV: 0.6736, TopV: 0.1985, BotRV: 0.0075, AllV: 0.0683 +[2026-01-29T21:32:14.723768Z] Loop 314: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0903, TopReg: 0.5922, AllReg: 0.7612, BotRReg: 0.7897, OV: 0.3110, AltV: 0.0684, CorV: 0.6749, TopV: 0.2045, BotRV: 0.0070, AllV: 0.0684 +[2026-01-29T21:32:17.092494Z] Loop 316: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0899, TopReg: 0.5852, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3111, AltV: 0.0684, CorV: 0.6752, TopV: 0.2114, BotRV: 0.0065, AllV: 0.0684 +[2026-01-29T21:32:19.457364Z] Loop 318: Reg: 0.4930, AltReg: 0.7612, CorReg: 0.0906, TopReg: 0.5792, AllReg: 0.7612, BotRReg: 0.7906, OV: 0.3108, AltV: 0.0684, CorV: 0.6745, TopV: 0.2175, BotRV: 0.0061, AllV: 0.0684 +[2026-01-29T21:32:21.831400Z] Loop 320: Reg: 0.4933, AltReg: 0.7612, CorReg: 0.0914, TopReg: 0.5761, AllReg: 0.7612, BotRReg: 0.7908, OV: 0.3105, AltV: 0.0683, CorV: 0.6737, TopV: 0.2206, BotRV: 0.0059, AllV: 0.0683 +[2026-01-29T21:32:24.194047Z] Loop 322: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0903, TopReg: 0.5809, AllReg: 0.7612, BotRReg: 0.7904, OV: 0.3109, AltV: 0.0684, CorV: 0.6748, TopV: 0.2158, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:32:26.563685Z] Loop 324: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0899, TopReg: 0.5883, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3111, AltV: 0.0684, CorV: 0.6752, TopV: 0.2084, BotRV: 0.0067, AllV: 0.0684 +[2026-01-29T21:32:28.929108Z] Loop 326: Reg: 0.4929, AltReg: 0.7612, CorReg: 0.0903, TopReg: 0.5931, AllReg: 0.7612, BotRReg: 0.7896, OV: 0.3109, AltV: 0.0684, CorV: 0.6748, TopV: 0.2036, BotRV: 0.0071, AllV: 0.0684 +[2026-01-29T21:32:31.298971Z] Loop 328: Reg: 0.4929, AltReg: 0.7612, CorReg: 0.0905, TopReg: 0.5941, AllReg: 0.7612, BotRReg: 0.7895, OV: 0.3109, AltV: 0.0683, CorV: 0.6746, TopV: 0.2026, BotRV: 0.0072, AllV: 0.0683 +[2026-01-29T21:32:33.674895Z] Loop 330: Reg: 0.4929, AltReg: 0.7612, CorReg: 0.0904, TopReg: 0.5935, AllReg: 0.7612, BotRReg: 0.7896, OV: 0.3109, AltV: 0.0683, CorV: 0.6747, TopV: 0.2031, BotRV: 0.0071, AllV: 0.0683 +[2026-01-29T21:32:36.044645Z] Loop 332: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5900, AllReg: 0.7612, BotRReg: 0.7898, OV: 0.3111, AltV: 0.0684, CorV: 0.6752, TopV: 0.2067, BotRV: 0.0069, AllV: 0.0684 +[2026-01-29T21:32:38.404918Z] Loop 334: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0899, TopReg: 0.5844, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3111, AltV: 0.0684, CorV: 0.6752, TopV: 0.2123, BotRV: 0.0065, AllV: 0.0684 +[2026-01-29T21:32:40.770803Z] Loop 336: Reg: 0.4929, AltReg: 0.7612, CorReg: 0.0905, TopReg: 0.5798, AllReg: 0.7612, BotRReg: 0.7905, OV: 0.3109, AltV: 0.0684, CorV: 0.6746, TopV: 0.2169, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:32:43.136767Z] Loop 338: Reg: 0.4931, AltReg: 0.7612, CorReg: 0.0908, TopReg: 0.5781, AllReg: 0.7612, BotRReg: 0.7906, OV: 0.3107, AltV: 0.0683, CorV: 0.6743, TopV: 0.2186, BotRV: 0.0061, AllV: 0.0683 +[2026-01-29T21:32:45.497781Z] Loop 340: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0902, TopReg: 0.5819, AllReg: 0.7612, BotRReg: 0.7904, OV: 0.3110, AltV: 0.0684, CorV: 0.6750, TopV: 0.2148, BotRV: 0.0063, AllV: 0.0684 +[2026-01-29T21:32:47.862184Z] Loop 342: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0899, TopReg: 0.5877, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3111, AltV: 0.0684, CorV: 0.6753, TopV: 0.2090, BotRV: 0.0067, AllV: 0.0684 +[2026-01-29T21:32:50.230303Z] Loop 344: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5908, AllReg: 0.7612, BotRReg: 0.7898, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2059, BotRV: 0.0069, AllV: 0.0684 +[2026-01-29T21:32:52.591363Z] Loop 346: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0901, TopReg: 0.5917, AllReg: 0.7612, BotRReg: 0.7897, OV: 0.3110, AltV: 0.0684, CorV: 0.6750, TopV: 0.2050, BotRV: 0.0070, AllV: 0.0684 +[2026-01-29T21:32:54.957056Z] Loop 348: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5907, AllReg: 0.7612, BotRReg: 0.7898, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2060, BotRV: 0.0069, AllV: 0.0684 +[2026-01-29T21:32:57.318303Z] Loop 350: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5886, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3111, AltV: 0.0684, CorV: 0.6753, TopV: 0.2081, BotRV: 0.0068, AllV: 0.0684 +[2026-01-29T21:32:59.681013Z] Loop 352: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5866, AllReg: 0.7612, BotRReg: 0.7901, OV: 0.3111, AltV: 0.0684, CorV: 0.6753, TopV: 0.2101, BotRV: 0.0066, AllV: 0.0684 +[2026-01-29T21:33:02.053701Z] Loop 354: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5829, AllReg: 0.7612, BotRReg: 0.7903, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2137, BotRV: 0.0064, AllV: 0.0684 +[2026-01-29T21:33:04.431665Z] Loop 356: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0903, TopReg: 0.5808, AllReg: 0.7612, BotRReg: 0.7905, OV: 0.3110, AltV: 0.0684, CorV: 0.6749, TopV: 0.2159, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:33:06.803697Z] Loop 358: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0902, TopReg: 0.5810, AllReg: 0.7612, BotRReg: 0.7904, OV: 0.3110, AltV: 0.0684, CorV: 0.6749, TopV: 0.2157, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:33:09.167160Z] Loop 360: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5825, AllReg: 0.7612, BotRReg: 0.7903, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2142, BotRV: 0.0063, AllV: 0.0684 +[2026-01-29T21:33:11.525476Z] Loop 362: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5867, AllReg: 0.7612, BotRReg: 0.7901, OV: 0.3112, AltV: 0.0684, CorV: 0.6754, TopV: 0.2100, BotRV: 0.0066, AllV: 0.0684 +[2026-01-29T21:33:13.896921Z] Loop 364: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5889, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3111, AltV: 0.0684, CorV: 0.6753, TopV: 0.2078, BotRV: 0.0068, AllV: 0.0684 +[2026-01-29T21:33:16.271367Z] Loop 366: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5885, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3111, AltV: 0.0684, CorV: 0.6753, TopV: 0.2082, BotRV: 0.0067, AllV: 0.0684 +[2026-01-29T21:33:18.639763Z] Loop 368: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0897, TopReg: 0.5866, AllReg: 0.7612, BotRReg: 0.7901, OV: 0.3112, AltV: 0.0684, CorV: 0.6754, TopV: 0.2101, BotRV: 0.0066, AllV: 0.0684 +[2026-01-29T21:33:21.007581Z] Loop 370: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5847, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3111, AltV: 0.0684, CorV: 0.6753, TopV: 0.2120, BotRV: 0.0065, AllV: 0.0684 +[2026-01-29T21:33:23.371568Z] Loop 372: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0899, TopReg: 0.5839, AllReg: 0.7612, BotRReg: 0.7903, OV: 0.3111, AltV: 0.0684, CorV: 0.6752, TopV: 0.2128, BotRV: 0.0064, AllV: 0.0684 +[2026-01-29T21:33:25.742063Z] Loop 374: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5853, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3112, AltV: 0.0684, CorV: 0.6753, TopV: 0.2114, BotRV: 0.0065, AllV: 0.0684 +[2026-01-29T21:33:28.108448Z] Loop 376: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5852, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3111, AltV: 0.0684, CorV: 0.6753, TopV: 0.2115, BotRV: 0.0065, AllV: 0.0684 +[2026-01-29T21:33:30.471410Z] Loop 378: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5868, AllReg: 0.7612, BotRReg: 0.7901, OV: 0.3112, AltV: 0.0684, CorV: 0.6754, TopV: 0.2099, BotRV: 0.0066, AllV: 0.0684 +[2026-01-29T21:33:32.836055Z] Loop 380: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5887, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3111, AltV: 0.0684, CorV: 0.6753, TopV: 0.2080, BotRV: 0.0068, AllV: 0.0684 +[2026-01-29T21:33:35.211469Z] Loop 382: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0899, TopReg: 0.5900, AllReg: 0.7612, BotRReg: 0.7898, OV: 0.3111, AltV: 0.0684, CorV: 0.6752, TopV: 0.2067, BotRV: 0.0069, AllV: 0.0684 +[2026-01-29T21:33:37.582885Z] Loop 384: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5916, AllReg: 0.7612, BotRReg: 0.7897, OV: 0.3110, AltV: 0.0683, CorV: 0.6751, TopV: 0.2051, BotRV: 0.0070, AllV: 0.0683 +[2026-01-29T21:33:39.952412Z] Loop 386: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0902, TopReg: 0.5932, AllReg: 0.7612, BotRReg: 0.7896, OV: 0.3110, AltV: 0.0683, CorV: 0.6749, TopV: 0.2035, BotRV: 0.0071, AllV: 0.0683 +[2026-01-29T21:33:42.316682Z] Loop 388: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5915, AllReg: 0.7612, BotRReg: 0.7897, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2052, BotRV: 0.0070, AllV: 0.0684 +[2026-01-29T21:33:44.689801Z] Loop 390: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5896, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3111, AltV: 0.0684, CorV: 0.6753, TopV: 0.2071, BotRV: 0.0068, AllV: 0.0684 +[2026-01-29T21:33:47.049235Z] Loop 392: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5865, AllReg: 0.7612, BotRReg: 0.7901, OV: 0.3112, AltV: 0.0684, CorV: 0.6754, TopV: 0.2102, BotRV: 0.0066, AllV: 0.0684 +[2026-01-29T21:33:49.415027Z] Loop 394: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0899, TopReg: 0.5837, AllReg: 0.7612, BotRReg: 0.7903, OV: 0.3111, AltV: 0.0684, CorV: 0.6752, TopV: 0.2129, BotRV: 0.0064, AllV: 0.0684 +[2026-01-29T21:33:51.781675Z] Loop 396: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0902, TopReg: 0.5808, AllReg: 0.7612, BotRReg: 0.7905, OV: 0.3110, AltV: 0.0684, CorV: 0.6749, TopV: 0.2159, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:33:54.142145Z] Loop 398: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0903, TopReg: 0.5805, AllReg: 0.7612, BotRReg: 0.7905, OV: 0.3109, AltV: 0.0684, CorV: 0.6748, TopV: 0.2162, BotRV: 0.0062, AllV: 0.0684 +[2026-01-29T21:33:56.500988Z] Loop 400: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0901, TopReg: 0.5814, AllReg: 0.7612, BotRReg: 0.7904, OV: 0.3110, AltV: 0.0684, CorV: 0.6750, TopV: 0.2153, BotRV: 0.0063, AllV: 0.0684 +[2026-01-29T21:33:58.870066Z] Loop 402: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5822, AllReg: 0.7612, BotRReg: 0.7904, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2145, BotRV: 0.0063, AllV: 0.0684 +[2026-01-29T21:34:01.231147Z] Loop 404: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5822, AllReg: 0.7612, BotRReg: 0.7904, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2144, BotRV: 0.0063, AllV: 0.0684 +[2026-01-29T21:34:03.594853Z] Loop 406: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0901, TopReg: 0.5812, AllReg: 0.7612, BotRReg: 0.7904, OV: 0.3110, AltV: 0.0684, CorV: 0.6750, TopV: 0.2155, BotRV: 0.0063, AllV: 0.0684 +[2026-01-29T21:34:05.955337Z] Loop 408: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0900, TopReg: 0.5820, AllReg: 0.7612, BotRReg: 0.7904, OV: 0.3111, AltV: 0.0684, CorV: 0.6751, TopV: 0.2147, BotRV: 0.0063, AllV: 0.0684 +[2026-01-29T21:34:08.316882Z] Loop 410: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0897, TopReg: 0.5851, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3112, AltV: 0.0684, CorV: 0.6754, TopV: 0.2116, BotRV: 0.0065, AllV: 0.0684 +[2026-01-29T21:34:10.681644Z] Loop 412: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5900, AllReg: 0.7612, BotRReg: 0.7898, OV: 0.3111, AltV: 0.0683, CorV: 0.6753, TopV: 0.2067, BotRV: 0.0068, AllV: 0.0683 +[2026-01-29T21:34:13.041341Z] Loop 414: Reg: 0.4929, AltReg: 0.7612, CorReg: 0.0904, TopReg: 0.5943, AllReg: 0.7612, BotRReg: 0.7895, OV: 0.3109, AltV: 0.0683, CorV: 0.6747, TopV: 0.2024, BotRV: 0.0072, AllV: 0.0683 +[2026-01-29T21:34:15.402902Z] Loop 416: Reg: 0.4933, AltReg: 0.7613, CorReg: 0.0913, TopReg: 0.5983, AllReg: 0.7613, BotRReg: 0.7892, OV: 0.3105, AltV: 0.0683, CorV: 0.6738, TopV: 0.1984, BotRV: 0.0074, AllV: 0.0683 +[2026-01-29T21:34:17.761687Z] Loop 418: Reg: 0.4931, AltReg: 0.7613, CorReg: 0.0908, TopReg: 0.5967, AllReg: 0.7613, BotRReg: 0.7894, OV: 0.3107, AltV: 0.0683, CorV: 0.6743, TopV: 0.2000, BotRV: 0.0073, AllV: 0.0683 +[2026-01-29T21:34:20.120372Z] Loop 420: Reg: 0.4927, AltReg: 0.7612, CorReg: 0.0898, TopReg: 0.5910, AllReg: 0.7612, BotRReg: 0.7898, OV: 0.3111, AltV: 0.0683, CorV: 0.6753, TopV: 0.2057, BotRV: 0.0069, AllV: 0.0683 +[2026-01-29T21:34:22.482595Z] Loop 422: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0897, TopReg: 0.5851, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3112, AltV: 0.0683, CorV: 0.6755, TopV: 0.2115, BotRV: 0.0065, AllV: 0.0683 +[2026-01-29T21:34:24.850013Z] Loop 424: Reg: 0.4928, AltReg: 0.7612, CorReg: 0.0902, TopReg: 0.5800, AllReg: 0.7612, BotRReg: 0.7905, OV: 0.3110, AltV: 0.0683, CorV: 0.6749, TopV: 0.2167, BotRV: 0.0062, AllV: 0.0683 +[2026-01-29T21:34:27.215559Z] Loop 426: Reg: 0.4932, AltReg: 0.7613, CorReg: 0.0911, TopReg: 0.5762, AllReg: 0.7613, BotRReg: 0.7908, OV: 0.3106, AltV: 0.0683, CorV: 0.6740, TopV: 0.2205, BotRV: 0.0059, AllV: 0.0683 +[2026-01-29T21:34:29.579998Z] Loop 428: Reg: 0.4930, AltReg: 0.7612, CorReg: 0.0907, TopReg: 0.5778, AllReg: 0.7612, BotRReg: 0.7907, OV: 0.3108, AltV: 0.0683, CorV: 0.6745, TopV: 0.2189, BotRV: 0.0060, AllV: 0.0683 +[2026-01-29T21:34:31.941061Z] Loop 430: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0897, TopReg: 0.5834, AllReg: 0.7612, BotRReg: 0.7903, OV: 0.3112, AltV: 0.0683, CorV: 0.6754, TopV: 0.2133, BotRV: 0.0064, AllV: 0.0683 +[2026-01-29T21:34:34.302530Z] Loop 432: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0897, TopReg: 0.5899, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3112, AltV: 0.0683, CorV: 0.6754, TopV: 0.2068, BotRV: 0.0068, AllV: 0.0683 +[2026-01-29T21:34:36.663779Z] Loop 434: Reg: 0.4930, AltReg: 0.7613, CorReg: 0.0906, TopReg: 0.5963, AllReg: 0.7613, BotRReg: 0.7894, OV: 0.3108, AltV: 0.0683, CorV: 0.6745, TopV: 0.2004, BotRV: 0.0073, AllV: 0.0683 +[2026-01-29T21:34:39.027115Z] Loop 436: Reg: 0.4931, AltReg: 0.7613, CorReg: 0.0908, TopReg: 0.5972, AllReg: 0.7613, BotRReg: 0.7893, OV: 0.3107, AltV: 0.0683, CorV: 0.6743, TopV: 0.1995, BotRV: 0.0074, AllV: 0.0683 +[2026-01-29T21:34:41.400395Z] Loop 438: Reg: 0.4927, AltReg: 0.7613, CorReg: 0.0898, TopReg: 0.5920, AllReg: 0.7613, BotRReg: 0.7897, OV: 0.3111, AltV: 0.0683, CorV: 0.6753, TopV: 0.2046, BotRV: 0.0070, AllV: 0.0683 +[2026-01-29T21:34:43.767980Z] Loop 440: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5883, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2084, BotRV: 0.0067, AllV: 0.0683 +[2026-01-29T21:34:46.136785Z] Loop 442: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5878, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2089, BotRV: 0.0067, AllV: 0.0683 +[2026-01-29T21:34:48.500319Z] Loop 444: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5872, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2095, BotRV: 0.0066, AllV: 0.0683 +[2026-01-29T21:34:50.859700Z] Loop 446: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5861, AllReg: 0.7612, BotRReg: 0.7901, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2106, BotRV: 0.0066, AllV: 0.0683 +[2026-01-29T21:34:53.216959Z] Loop 448: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5852, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2115, BotRV: 0.0065, AllV: 0.0683 +[2026-01-29T21:34:55.573178Z] Loop 450: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0897, TopReg: 0.5908, AllReg: 0.7612, BotRReg: 0.7898, OV: 0.3112, AltV: 0.0683, CorV: 0.6755, TopV: 0.2059, BotRV: 0.0069, AllV: 0.0683 +[2026-01-29T21:34:57.931275Z] Loop 452: Reg: 0.4929, AltReg: 0.7613, CorReg: 0.0903, TopReg: 0.5951, AllReg: 0.7613, BotRReg: 0.7895, OV: 0.3109, AltV: 0.0683, CorV: 0.6748, TopV: 0.2016, BotRV: 0.0072, AllV: 0.0683 +[2026-01-29T21:35:00.289190Z] Loop 454: Reg: 0.4928, AltReg: 0.7613, CorReg: 0.0902, TopReg: 0.5945, AllReg: 0.7613, BotRReg: 0.7895, OV: 0.3110, AltV: 0.0683, CorV: 0.6750, TopV: 0.2022, BotRV: 0.0072, AllV: 0.0683 +[2026-01-29T21:35:02.653110Z] Loop 456: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5860, AllReg: 0.7612, BotRReg: 0.7901, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2107, BotRV: 0.0066, AllV: 0.0683 +[2026-01-29T21:35:05.013924Z] Loop 458: Reg: 0.4929, AltReg: 0.7613, CorReg: 0.0903, TopReg: 0.5789, AllReg: 0.7613, BotRReg: 0.7906, OV: 0.3109, AltV: 0.0683, CorV: 0.6748, TopV: 0.2178, BotRV: 0.0061, AllV: 0.0683 +[2026-01-29T21:35:07.386264Z] Loop 460: Reg: 0.4931, AltReg: 0.7613, CorReg: 0.0909, TopReg: 0.5763, AllReg: 0.7613, BotRReg: 0.7908, OV: 0.3106, AltV: 0.0683, CorV: 0.6742, TopV: 0.2204, BotRV: 0.0059, AllV: 0.0683 +[2026-01-29T21:35:09.755046Z] Loop 462: Reg: 0.4929, AltReg: 0.7613, CorReg: 0.0903, TopReg: 0.5786, AllReg: 0.7613, BotRReg: 0.7906, OV: 0.3109, AltV: 0.0683, CorV: 0.6748, TopV: 0.2180, BotRV: 0.0061, AllV: 0.0683 +[2026-01-29T21:35:12.124887Z] Loop 464: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5843, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2124, BotRV: 0.0064, AllV: 0.0683 +[2026-01-29T21:35:14.510874Z] Loop 466: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5875, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3113, AltV: 0.0683, CorV: 0.6757, TopV: 0.2092, BotRV: 0.0067, AllV: 0.0683 +[2026-01-29T21:35:16.884704Z] Loop 468: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5889, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2078, BotRV: 0.0068, AllV: 0.0683 +[2026-01-29T21:35:19.247184Z] Loop 470: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5890, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2077, BotRV: 0.0068, AllV: 0.0683 +[2026-01-29T21:35:21.609209Z] Loop 472: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5880, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3113, AltV: 0.0683, CorV: 0.6757, TopV: 0.2086, BotRV: 0.0067, AllV: 0.0683 +[2026-01-29T21:35:23.982164Z] Loop 474: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0894, TopReg: 0.5874, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3113, AltV: 0.0683, CorV: 0.6757, TopV: 0.2093, BotRV: 0.0067, AllV: 0.0683 +[2026-01-29T21:35:26.345627Z] Loop 476: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0894, TopReg: 0.5880, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3113, AltV: 0.0683, CorV: 0.6757, TopV: 0.2087, BotRV: 0.0067, AllV: 0.0683 +[2026-01-29T21:35:28.707313Z] Loop 478: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5883, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3113, AltV: 0.0683, CorV: 0.6757, TopV: 0.2084, BotRV: 0.0067, AllV: 0.0683 +[2026-01-29T21:35:31.071484Z] Loop 480: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0894, TopReg: 0.5865, AllReg: 0.7612, BotRReg: 0.7901, OV: 0.3113, AltV: 0.0683, CorV: 0.6757, TopV: 0.2102, BotRV: 0.0066, AllV: 0.0683 +[2026-01-29T21:35:33.446820Z] Loop 482: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5861, AllReg: 0.7612, BotRReg: 0.7901, OV: 0.3113, AltV: 0.0683, CorV: 0.6757, TopV: 0.2106, BotRV: 0.0066, AllV: 0.0683 +[2026-01-29T21:35:35.809796Z] Loop 484: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5854, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2113, BotRV: 0.0065, AllV: 0.0683 +[2026-01-29T21:35:38.175259Z] Loop 486: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0896, TopReg: 0.5832, AllReg: 0.7612, BotRReg: 0.7903, OV: 0.3112, AltV: 0.0683, CorV: 0.6755, TopV: 0.2135, BotRV: 0.0064, AllV: 0.0683 +[2026-01-29T21:35:40.536339Z] Loop 488: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5839, AllReg: 0.7612, BotRReg: 0.7903, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2128, BotRV: 0.0064, AllV: 0.0683 +[2026-01-29T21:35:42.895849Z] Loop 490: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5898, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2069, BotRV: 0.0068, AllV: 0.0683 +[2026-01-29T21:35:45.259816Z] Loop 492: Reg: 0.4927, AltReg: 0.7613, CorReg: 0.0897, TopReg: 0.5923, AllReg: 0.7613, BotRReg: 0.7897, OV: 0.3111, AltV: 0.0683, CorV: 0.6754, TopV: 0.2044, BotRV: 0.0070, AllV: 0.0683 +[2026-01-29T21:35:47.631986Z] Loop 494: Reg: 0.4926, AltReg: 0.7613, CorReg: 0.0897, TopReg: 0.5919, AllReg: 0.7613, BotRReg: 0.7897, OV: 0.3112, AltV: 0.0683, CorV: 0.6754, TopV: 0.2048, BotRV: 0.0070, AllV: 0.0683 +[2026-01-29T21:35:50.002834Z] Loop 496: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0894, TopReg: 0.5878, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3113, AltV: 0.0683, CorV: 0.6757, TopV: 0.2089, BotRV: 0.0067, AllV: 0.0683 +[2026-01-29T21:35:52.364180Z] Loop 498: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0897, TopReg: 0.5818, AllReg: 0.7612, BotRReg: 0.7904, OV: 0.3111, AltV: 0.0683, CorV: 0.6754, TopV: 0.2149, BotRV: 0.0063, AllV: 0.0683 +[2026-01-29T21:35:54.726563Z] Loop 500: Reg: 0.4933, AltReg: 0.7613, CorReg: 0.0913, TopReg: 0.5748, AllReg: 0.7613, BotRReg: 0.7908, OV: 0.3105, AltV: 0.0683, CorV: 0.6738, TopV: 0.2218, BotRV: 0.0058, AllV: 0.0683 +[2026-01-29T21:36:00.574278Z] Loop 505: Reg: 0.4931, AltReg: 0.7613, CorReg: 0.0907, TopReg: 0.5768, AllReg: 0.7613, BotRReg: 0.7907, OV: 0.3107, AltV: 0.0683, CorV: 0.6744, TopV: 0.2199, BotRV: 0.0060, AllV: 0.0683 +[2026-01-29T21:36:06.419649Z] Loop 510: Reg: 0.4932, AltReg: 0.7613, CorReg: 0.0911, TopReg: 0.5986, AllReg: 0.7613, BotRReg: 0.7892, OV: 0.3106, AltV: 0.0683, CorV: 0.6740, TopV: 0.1981, BotRV: 0.0075, AllV: 0.0683 +[2026-01-29T21:36:12.265894Z] Loop 515: Reg: 0.4926, AltReg: 0.7612, CorReg: 0.0896, TopReg: 0.5907, AllReg: 0.7612, BotRReg: 0.7898, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2060, BotRV: 0.0069, AllV: 0.0683 +[2026-01-29T21:36:18.111593Z] Loop 520: Reg: 0.4933, AltReg: 0.7613, CorReg: 0.0913, TopReg: 0.5750, AllReg: 0.7613, BotRReg: 0.7908, OV: 0.3105, AltV: 0.0683, CorV: 0.6739, TopV: 0.2217, BotRV: 0.0059, AllV: 0.0683 +[2026-01-29T21:36:23.959674Z] Loop 525: Reg: 0.4928, AltReg: 0.7613, CorReg: 0.0901, TopReg: 0.5794, AllReg: 0.7613, BotRReg: 0.7906, OV: 0.3110, AltV: 0.0683, CorV: 0.6750, TopV: 0.2173, BotRV: 0.0061, AllV: 0.0683 +[2026-01-29T21:36:29.795888Z] Loop 530: Reg: 0.4929, AltReg: 0.7613, CorReg: 0.0904, TopReg: 0.5961, AllReg: 0.7613, BotRReg: 0.7894, OV: 0.3108, AltV: 0.0683, CorV: 0.6747, TopV: 0.2006, BotRV: 0.0073, AllV: 0.0683 +[2026-01-29T21:36:35.631701Z] Loop 535: Reg: 0.4930, AltReg: 0.7613, CorReg: 0.0907, TopReg: 0.5974, AllReg: 0.7613, BotRReg: 0.7893, OV: 0.3107, AltV: 0.0683, CorV: 0.6744, TopV: 0.1993, BotRV: 0.0074, AllV: 0.0683 +[2026-01-29T21:36:41.474487Z] Loop 540: Reg: 0.4925, AltReg: 0.7613, CorReg: 0.0894, TopReg: 0.5894, AllReg: 0.7613, BotRReg: 0.7899, OV: 0.3113, AltV: 0.0683, CorV: 0.6758, TopV: 0.2073, BotRV: 0.0068, AllV: 0.0683 +[2026-01-29T21:36:47.346866Z] Loop 545: Reg: 0.4927, AltReg: 0.7613, CorReg: 0.0899, TopReg: 0.5801, AllReg: 0.7613, BotRReg: 0.7905, OV: 0.3111, AltV: 0.0683, CorV: 0.6752, TopV: 0.2166, BotRV: 0.0062, AllV: 0.0683 +[2026-01-29T21:36:53.205589Z] Loop 550: Reg: 0.4925, AltReg: 0.7613, CorReg: 0.0894, TopReg: 0.5904, AllReg: 0.7613, BotRReg: 0.7898, OV: 0.3113, AltV: 0.0683, CorV: 0.6757, TopV: 0.2063, BotRV: 0.0069, AllV: 0.0683 +[2026-01-29T21:36:59.069798Z] Loop 555: Reg: 0.4933, AltReg: 0.7613, CorReg: 0.0913, TopReg: 0.6000, AllReg: 0.7613, BotRReg: 0.7891, OV: 0.3104, AltV: 0.0682, CorV: 0.6738, TopV: 0.1967, BotRV: 0.0076, AllV: 0.0682 +[2026-01-29T21:37:04.921661Z] Loop 560: Reg: 0.4926, AltReg: 0.7613, CorReg: 0.0897, TopReg: 0.5929, AllReg: 0.7613, BotRReg: 0.7896, OV: 0.3111, AltV: 0.0683, CorV: 0.6754, TopV: 0.2038, BotRV: 0.0070, AllV: 0.0683 +[2026-01-29T21:37:10.771479Z] Loop 565: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0893, TopReg: 0.5876, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3113, AltV: 0.0683, CorV: 0.6758, TopV: 0.2091, BotRV: 0.0067, AllV: 0.0683 +[2026-01-29T21:37:16.628998Z] Loop 570: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0895, TopReg: 0.5836, AllReg: 0.7612, BotRReg: 0.7903, OV: 0.3112, AltV: 0.0683, CorV: 0.6756, TopV: 0.2131, BotRV: 0.0064, AllV: 0.0683 +[2026-01-29T21:37:22.482629Z] Loop 575: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0893, TopReg: 0.5881, AllReg: 0.7612, BotRReg: 0.7900, OV: 0.3113, AltV: 0.0683, CorV: 0.6758, TopV: 0.2086, BotRV: 0.0067, AllV: 0.0683 +[2026-01-29T21:37:28.323830Z] Loop 580: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0894, TopReg: 0.5898, AllReg: 0.7612, BotRReg: 0.7899, OV: 0.3113, AltV: 0.0683, CorV: 0.6757, TopV: 0.2069, BotRV: 0.0068, AllV: 0.0683 +[2026-01-29T21:37:34.174506Z] Loop 585: Reg: 0.4925, AltReg: 0.7612, CorReg: 0.0893, TopReg: 0.5855, AllReg: 0.7612, BotRReg: 0.7902, OV: 0.3113, AltV: 0.0683, CorV: 0.6758, TopV: 0.2112, BotRV: 0.0065, AllV: 0.0683 +[2026-01-29T21:37:40.015410Z] Loop 590: Reg: 0.4929, AltReg: 0.7613, CorReg: 0.0904, TopReg: 0.5772, AllReg: 0.7613, BotRReg: 0.7907, OV: 0.3108, AltV: 0.0683, CorV: 0.6747, TopV: 0.2195, BotRV: 0.0060, AllV: 0.0683 +[2026-01-29T21:37:45.855365Z] Loop 595: Reg: 0.4929, AltReg: 0.7613, CorReg: 0.0902, TopReg: 0.5779, AllReg: 0.7613, BotRReg: 0.7907, OV: 0.3109, AltV: 0.0683, CorV: 0.6749, TopV: 0.2188, BotRV: 0.0060, AllV: 0.0683 +[2026-01-29T21:37:51.699986Z] Loop 600: Reg: 0.4924, AltReg: 0.7613, CorReg: 0.0891, TopReg: 0.5873, AllReg: 0.7613, BotRReg: 0.7900, OV: 0.3114, AltV: 0.0683, CorV: 0.6760, TopV: 0.2094, BotRV: 0.0066, AllV: 0.0683 +[2026-01-29T21:37:57.544270Z] Loop 605: Reg: 0.4926, AltReg: 0.7613, CorReg: 0.0896, TopReg: 0.5937, AllReg: 0.7613, BotRReg: 0.7896, OV: 0.3112, AltV: 0.0683, CorV: 0.6755, TopV: 0.2030, BotRV: 0.0071, AllV: 0.0683 +[2026-01-29T21:38:03.382220Z] Loop 610: Reg: 0.4924, AltReg: 0.7613, CorReg: 0.0892, TopReg: 0.5841, AllReg: 0.7613, BotRReg: 0.7903, OV: 0.3113, AltV: 0.0683, CorV: 0.6759, TopV: 0.2126, BotRV: 0.0064, AllV: 0.0683 +[2026-01-29T21:38:09.229077Z] Loop 615: Reg: 0.4924, AltReg: 0.7613, CorReg: 0.0892, TopReg: 0.5841, AllReg: 0.7613, BotRReg: 0.7903, OV: 0.3113, AltV: 0.0683, CorV: 0.6759, TopV: 0.2126, BotRV: 0.0064, AllV: 0.0683 +[2026-01-29T21:38:15.074474Z] Loop 620: Reg: 0.4925, AltReg: 0.7613, CorReg: 0.0894, TopReg: 0.5924, AllReg: 0.7613, BotRReg: 0.7897, OV: 0.3112, AltV: 0.0683, CorV: 0.6757, TopV: 0.2043, BotRV: 0.0070, AllV: 0.0683 +[2026-01-29T21:38:20.915102Z] Loop 625: Reg: 0.4925, AltReg: 0.7613, CorReg: 0.0894, TopReg: 0.5821, AllReg: 0.7613, BotRReg: 0.7904, OV: 0.3113, AltV: 0.0683, CorV: 0.6758, TopV: 0.2146, BotRV: 0.0063, AllV: 0.0683 +[2026-01-29T21:38:26.757008Z] Loop 630: Reg: 0.4924, AltReg: 0.7613, CorReg: 0.0892, TopReg: 0.5836, AllReg: 0.7613, BotRReg: 0.7903, OV: 0.3114, AltV: 0.0683, CorV: 0.6759, TopV: 0.2131, BotRV: 0.0064, AllV: 0.0683 +[2026-01-29T21:38:32.607827Z] Loop 635: Reg: 0.4926, AltReg: 0.7613, CorReg: 0.0896, TopReg: 0.5945, AllReg: 0.7613, BotRReg: 0.7895, OV: 0.3111, AltV: 0.0683, CorV: 0.6755, TopV: 0.2021, BotRV: 0.0071, AllV: 0.0683 +[2026-01-29T21:38:38.452369Z] Loop 640: Reg: 0.4924, AltReg: 0.7613, CorReg: 0.0891, TopReg: 0.5910, AllReg: 0.7613, BotRReg: 0.7898, OV: 0.3114, AltV: 0.0683, CorV: 0.6760, TopV: 0.2057, BotRV: 0.0069, AllV: 0.0683 +[2026-01-29T21:38:44.301368Z] Loop 645: Reg: 0.4929, AltReg: 0.7613, CorReg: 0.0903, TopReg: 0.5769, AllReg: 0.7613, BotRReg: 0.7907, OV: 0.3109, AltV: 0.0682, CorV: 0.6749, TopV: 0.2198, BotRV: 0.0060, AllV: 0.0682 +[2026-01-29T21:38:50.146377Z] Loop 650: Reg: 0.4928, AltReg: 0.7613, CorReg: 0.0901, TopReg: 0.5774, AllReg: 0.7613, BotRReg: 0.7907, OV: 0.3110, AltV: 0.0682, CorV: 0.6751, TopV: 0.2192, BotRV: 0.0060, AllV: 0.0682 +[2026-01-29T21:38:55.987139Z] Loop 655: Reg: 0.4923, AltReg: 0.7613, CorReg: 0.0888, TopReg: 0.5873, AllReg: 0.7613, BotRReg: 0.7901, OV: 0.3115, AltV: 0.0683, CorV: 0.6763, TopV: 0.2094, BotRV: 0.0066, AllV: 0.0683 +[2026-01-29T21:39:01.830008Z] Loop 660: Reg: 0.4924, AltReg: 0.7613, CorReg: 0.0890, TopReg: 0.5916, AllReg: 0.7613, BotRReg: 0.7898, OV: 0.3114, AltV: 0.0682, CorV: 0.6761, TopV: 0.2051, BotRV: 0.0069, AllV: 0.0682 +[2026-01-29T21:39:07.695635Z] Loop 665: Reg: 0.4923, AltReg: 0.7613, CorReg: 0.0887, TopReg: 0.5888, AllReg: 0.7613, BotRReg: 0.7900, OV: 0.3115, AltV: 0.0682, CorV: 0.6764, TopV: 0.2079, BotRV: 0.0067, AllV: 0.0682 +[2026-01-29T21:39:13.543832Z] Loop 670: Reg: 0.4923, AltReg: 0.7613, CorReg: 0.0887, TopReg: 0.5858, AllReg: 0.7613, BotRReg: 0.7902, OV: 0.3115, AltV: 0.0682, CorV: 0.6764, TopV: 0.2109, BotRV: 0.0065, AllV: 0.0682 +[2026-01-29T21:39:19.406137Z] Loop 675: Reg: 0.4923, AltReg: 0.7613, CorReg: 0.0887, TopReg: 0.5842, AllReg: 0.7613, BotRReg: 0.7903, OV: 0.3115, AltV: 0.0682, CorV: 0.6764, TopV: 0.2124, BotRV: 0.0064, AllV: 0.0682 +[2026-01-29T21:39:25.260963Z] Loop 680: Reg: 0.4922, AltReg: 0.7613, CorReg: 0.0886, TopReg: 0.5870, AllReg: 0.7613, BotRReg: 0.7901, OV: 0.3116, AltV: 0.0682, CorV: 0.6765, TopV: 0.2097, BotRV: 0.0066, AllV: 0.0682 +[2026-01-29T21:39:31.103767Z] Loop 685: Reg: 0.4923, AltReg: 0.7613, CorReg: 0.0888, TopReg: 0.5832, AllReg: 0.7613, BotRReg: 0.7903, OV: 0.3115, AltV: 0.0682, CorV: 0.6763, TopV: 0.2135, BotRV: 0.0063, AllV: 0.0682 +[2026-01-29T21:39:36.950155Z] Loop 690: Reg: 0.4922, AltReg: 0.7613, CorReg: 0.0885, TopReg: 0.5891, AllReg: 0.7613, BotRReg: 0.7899, OV: 0.3116, AltV: 0.0682, CorV: 0.6766, TopV: 0.2076, BotRV: 0.0067, AllV: 0.0682 +[2026-01-29T21:39:42.799080Z] Loop 695: Reg: 0.4922, AltReg: 0.7613, CorReg: 0.0885, TopReg: 0.5860, AllReg: 0.7613, BotRReg: 0.7902, OV: 0.3116, AltV: 0.0682, CorV: 0.6766, TopV: 0.2107, BotRV: 0.0065, AllV: 0.0682 +[2026-01-29T21:39:48.641704Z] Loop 700: Reg: 0.4929, AltReg: 0.7614, CorReg: 0.0902, TopReg: 0.5757, AllReg: 0.7614, BotRReg: 0.7908, OV: 0.3109, AltV: 0.0682, CorV: 0.6750, TopV: 0.2210, BotRV: 0.0059, AllV: 0.0682 +[2026-01-29T21:39:54.492946Z] Loop 705: Reg: 0.4921, AltReg: 0.7613, CorReg: 0.0884, TopReg: 0.5859, AllReg: 0.7613, BotRReg: 0.7902, OV: 0.3116, AltV: 0.0682, CorV: 0.6767, TopV: 0.2108, BotRV: 0.0065, AllV: 0.0682 +[2026-01-29T21:40:00.340094Z] Loop 710: Reg: 0.4926, AltReg: 0.7614, CorReg: 0.0894, TopReg: 0.5970, AllReg: 0.7614, BotRReg: 0.7894, OV: 0.3112, AltV: 0.0682, CorV: 0.6757, TopV: 0.1997, BotRV: 0.0073, AllV: 0.0682 +[2026-01-29T21:40:06.181541Z] Loop 715: Reg: 0.4921, AltReg: 0.7613, CorReg: 0.0884, TopReg: 0.5841, AllReg: 0.7613, BotRReg: 0.7903, OV: 0.3116, AltV: 0.0682, CorV: 0.6767, TopV: 0.2126, BotRV: 0.0064, AllV: 0.0682 +[2026-01-29T21:40:12.022516Z] Loop 720: Reg: 0.4923, AltReg: 0.7613, CorReg: 0.0888, TopReg: 0.5806, AllReg: 0.7613, BotRReg: 0.7905, OV: 0.3115, AltV: 0.0682, CorV: 0.6763, TopV: 0.2161, BotRV: 0.0062, AllV: 0.0682 +[2026-01-29T21:40:17.866240Z] Loop 725: Reg: 0.4921, AltReg: 0.7613, CorReg: 0.0883, TopReg: 0.5902, AllReg: 0.7613, BotRReg: 0.7899, OV: 0.3117, AltV: 0.0682, CorV: 0.6769, TopV: 0.2065, BotRV: 0.0068, AllV: 0.0682 +[2026-01-29T21:40:23.713856Z] Loop 730: Reg: 0.4922, AltReg: 0.7613, CorReg: 0.0884, TopReg: 0.5825, AllReg: 0.7613, BotRReg: 0.7904, OV: 0.3116, AltV: 0.0682, CorV: 0.6767, TopV: 0.2142, BotRV: 0.0063, AllV: 0.0682 +[2026-01-29T21:40:29.561745Z] Loop 735: Reg: 0.4921, AltReg: 0.7613, CorReg: 0.0883, TopReg: 0.5829, AllReg: 0.7613, BotRReg: 0.7904, OV: 0.3117, AltV: 0.0682, CorV: 0.6768, TopV: 0.2138, BotRV: 0.0063, AllV: 0.0682 +[2026-01-29T21:40:35.405931Z] Loop 740: Reg: 0.4920, AltReg: 0.7613, CorReg: 0.0880, TopReg: 0.5903, AllReg: 0.7613, BotRReg: 0.7899, OV: 0.3118, AltV: 0.0682, CorV: 0.6771, TopV: 0.2064, BotRV: 0.0068, AllV: 0.0682 +[2026-01-29T21:40:41.246415Z] Loop 745: Reg: 0.4920, AltReg: 0.7613, CorReg: 0.0879, TopReg: 0.5860, AllReg: 0.7613, BotRReg: 0.7902, OV: 0.3118, AltV: 0.0682, CorV: 0.6772, TopV: 0.2107, BotRV: 0.0065, AllV: 0.0682 +[2026-01-29T21:40:47.089024Z] Loop 750: Reg: 0.4920, AltReg: 0.7613, CorReg: 0.0879, TopReg: 0.5843, AllReg: 0.7613, BotRReg: 0.7903, OV: 0.3118, AltV: 0.0682, CorV: 0.6772, TopV: 0.2124, BotRV: 0.0064, AllV: 0.0682 +[2026-01-29T21:40:52.938923Z] Loop 755: Reg: 0.4919, AltReg: 0.7614, CorReg: 0.0878, TopReg: 0.5896, AllReg: 0.7614, BotRReg: 0.7899, OV: 0.3119, AltV: 0.0682, CorV: 0.6774, TopV: 0.2071, BotRV: 0.0067, AllV: 0.0682 +[2026-01-29T21:40:58.777177Z] Loop 760: Reg: 0.4919, AltReg: 0.7614, CorReg: 0.0877, TopReg: 0.5899, AllReg: 0.7614, BotRReg: 0.7899, OV: 0.3119, AltV: 0.0682, CorV: 0.6774, TopV: 0.2067, BotRV: 0.0068, AllV: 0.0682 +[2026-01-29T21:41:04.618051Z] Loop 765: Reg: 0.4922, AltReg: 0.7614, CorReg: 0.0885, TopReg: 0.5793, AllReg: 0.7614, BotRReg: 0.7906, OV: 0.3116, AltV: 0.0682, CorV: 0.6766, TopV: 0.2174, BotRV: 0.0061, AllV: 0.0682 +[2026-01-29T21:41:10.460568Z] Loop 770: Reg: 0.4920, AltReg: 0.7614, CorReg: 0.0879, TopReg: 0.5935, AllReg: 0.7614, BotRReg: 0.7897, OV: 0.3118, AltV: 0.0682, CorV: 0.6773, TopV: 0.2032, BotRV: 0.0070, AllV: 0.0682 +[2026-01-29T21:41:16.320609Z] Loop 775: Reg: 0.4918, AltReg: 0.7614, CorReg: 0.0874, TopReg: 0.5904, AllReg: 0.7614, BotRReg: 0.7899, OV: 0.3120, AltV: 0.0682, CorV: 0.6777, TopV: 0.2063, BotRV: 0.0068, AllV: 0.0682 +[2026-01-29T21:41:22.181004Z] Loop 780: Reg: 0.4919, AltReg: 0.7614, CorReg: 0.0878, TopReg: 0.5813, AllReg: 0.7614, BotRReg: 0.7905, OV: 0.3118, AltV: 0.0682, CorV: 0.6773, TopV: 0.2154, BotRV: 0.0062, AllV: 0.0682 +[2026-01-29T21:41:28.035514Z] Loop 785: Reg: 0.4917, AltReg: 0.7614, CorReg: 0.0872, TopReg: 0.5853, AllReg: 0.7614, BotRReg: 0.7902, OV: 0.3121, AltV: 0.0682, CorV: 0.6779, TopV: 0.2114, BotRV: 0.0064, AllV: 0.0682 +[2026-01-29T21:41:33.885366Z] Loop 790: Reg: 0.4916, AltReg: 0.7614, CorReg: 0.0870, TopReg: 0.5900, AllReg: 0.7614, BotRReg: 0.7899, OV: 0.3121, AltV: 0.0682, CorV: 0.6781, TopV: 0.2067, BotRV: 0.0067, AllV: 0.0682 +[2026-01-29T21:41:39.742062Z] Loop 795: Reg: 0.4916, AltReg: 0.7614, CorReg: 0.0869, TopReg: 0.5903, AllReg: 0.7614, BotRReg: 0.7899, OV: 0.3122, AltV: 0.0682, CorV: 0.6782, TopV: 0.2064, BotRV: 0.0068, AllV: 0.0682 +[2026-01-29T21:41:45.586188Z] Loop 800: Reg: 0.4916, AltReg: 0.7614, CorReg: 0.0869, TopReg: 0.5923, AllReg: 0.7614, BotRReg: 0.7898, OV: 0.3122, AltV: 0.0682, CorV: 0.6782, TopV: 0.2044, BotRV: 0.0069, AllV: 0.0682 +[2026-01-29T21:41:51.426690Z] Loop 805: Reg: 0.4914, AltReg: 0.7614, CorReg: 0.0865, TopReg: 0.5885, AllReg: 0.7614, BotRReg: 0.7901, OV: 0.3123, AltV: 0.0682, CorV: 0.6786, TopV: 0.2082, BotRV: 0.0066, AllV: 0.0682 +[2026-01-29T21:41:57.275112Z] Loop 810: Reg: 0.4915, AltReg: 0.7614, CorReg: 0.0866, TopReg: 0.5934, AllReg: 0.7614, BotRReg: 0.7897, OV: 0.3123, AltV: 0.0682, CorV: 0.6785, TopV: 0.2033, BotRV: 0.0070, AllV: 0.0682 +[2026-01-29T21:42:03.115649Z] Loop 815: Reg: 0.4914, AltReg: 0.7614, CorReg: 0.0864, TopReg: 0.5832, AllReg: 0.7614, BotRReg: 0.7904, OV: 0.3124, AltV: 0.0681, CorV: 0.6787, TopV: 0.2135, BotRV: 0.0063, AllV: 0.0681 +[2026-01-29T21:42:08.963674Z] Loop 820: Reg: 0.4923, AltReg: 0.7615, CorReg: 0.0884, TopReg: 0.5745, AllReg: 0.7615, BotRReg: 0.7910, OV: 0.3115, AltV: 0.0681, CorV: 0.6767, TopV: 0.2222, BotRV: 0.0057, AllV: 0.0681 +[2026-01-29T21:42:14.810329Z] Loop 825: Reg: 0.4914, AltReg: 0.7614, CorReg: 0.0863, TopReg: 0.5810, AllReg: 0.7614, BotRReg: 0.7906, OV: 0.3124, AltV: 0.0681, CorV: 0.6788, TopV: 0.2157, BotRV: 0.0061, AllV: 0.0681 +[2026-01-29T21:42:20.655304Z] Loop 830: Reg: 0.4924, AltReg: 0.7614, CorReg: 0.0888, TopReg: 0.6040, AllReg: 0.7614, BotRReg: 0.7890, OV: 0.3114, AltV: 0.0681, CorV: 0.6763, TopV: 0.1926, BotRV: 0.0077, AllV: 0.0681 +[2026-01-29T21:42:26.507704Z] Loop 835: Reg: 0.4909, AltReg: 0.7614, CorReg: 0.0851, TopReg: 0.5895, AllReg: 0.7614, BotRReg: 0.7900, OV: 0.3129, AltV: 0.0681, CorV: 0.6800, TopV: 0.2072, BotRV: 0.0067, AllV: 0.0681 +[2026-01-29T21:42:32.354658Z] Loop 840: Reg: 0.4915, AltReg: 0.7615, CorReg: 0.0865, TopReg: 0.5776, AllReg: 0.7615, BotRReg: 0.7908, OV: 0.3123, AltV: 0.0681, CorV: 0.6786, TopV: 0.2191, BotRV: 0.0059, AllV: 0.0681 +[2026-01-29T21:42:38.198062Z] Loop 845: Reg: 0.4908, AltReg: 0.7614, CorReg: 0.0848, TopReg: 0.5943, AllReg: 0.7614, BotRReg: 0.7897, OV: 0.3130, AltV: 0.0681, CorV: 0.6803, TopV: 0.2024, BotRV: 0.0070, AllV: 0.0681 +[2026-01-29T21:42:44.043835Z] Loop 850: Reg: 0.4918, AltReg: 0.7616, CorReg: 0.0871, TopReg: 0.6052, AllReg: 0.7616, BotRReg: 0.7890, OV: 0.3120, AltV: 0.0680, CorV: 0.6780, TopV: 0.1914, BotRV: 0.0077, AllV: 0.0680 +[2026-01-29T21:42:49.885296Z] Loop 855: Reg: 0.4916, AltReg: 0.7615, CorReg: 0.0868, TopReg: 0.5744, AllReg: 0.7615, BotRReg: 0.7910, OV: 0.3121, AltV: 0.0680, CorV: 0.6783, TopV: 0.2223, BotRV: 0.0057, AllV: 0.0680 +[2026-01-29T21:42:55.728071Z] Loop 860: Reg: 0.4904, AltReg: 0.7614, CorReg: 0.0838, TopReg: 0.5943, AllReg: 0.7614, BotRReg: 0.7898, OV: 0.3134, AltV: 0.0681, CorV: 0.6813, TopV: 0.2024, BotRV: 0.0069, AllV: 0.0681 +[2026-01-29T21:43:01.577478Z] Loop 865: Reg: 0.4907, AltReg: 0.7615, CorReg: 0.0845, TopReg: 0.6007, AllReg: 0.7615, BotRReg: 0.7893, OV: 0.3131, AltV: 0.0681, CorV: 0.6806, TopV: 0.1960, BotRV: 0.0074, AllV: 0.0681 +[2026-01-29T21:43:07.429028Z] Loop 870: Reg: 0.4900, AltReg: 0.7615, CorReg: 0.0828, TopReg: 0.5871, AllReg: 0.7615, BotRReg: 0.7903, OV: 0.3138, AltV: 0.0681, CorV: 0.6823, TopV: 0.2096, BotRV: 0.0064, AllV: 0.0681 +[2026-01-29T21:43:13.281799Z] Loop 875: Reg: 0.4897, AltReg: 0.7615, CorReg: 0.0821, TopReg: 0.5908, AllReg: 0.7615, BotRReg: 0.7901, OV: 0.3141, AltV: 0.0681, CorV: 0.6830, TopV: 0.2059, BotRV: 0.0066, AllV: 0.0681 +[2026-01-29T21:43:19.131240Z] Loop 880: Reg: 0.4895, AltReg: 0.7615, CorReg: 0.0815, TopReg: 0.5900, AllReg: 0.7615, BotRReg: 0.7901, OV: 0.3143, AltV: 0.0681, CorV: 0.6837, TopV: 0.2067, BotRV: 0.0066, AllV: 0.0681 +[2026-01-29T21:43:24.979284Z] Loop 885: Reg: 0.4893, AltReg: 0.7615, CorReg: 0.0810, TopReg: 0.5862, AllReg: 0.7615, BotRReg: 0.7904, OV: 0.3145, AltV: 0.0681, CorV: 0.6841, TopV: 0.2105, BotRV: 0.0063, AllV: 0.0681 +[2026-01-29T21:43:30.826322Z] Loop 890: Reg: 0.4895, AltReg: 0.7615, CorReg: 0.0814, TopReg: 0.6034, AllReg: 0.7615, BotRReg: 0.7892, OV: 0.3143, AltV: 0.0681, CorV: 0.6837, TopV: 0.1933, BotRV: 0.0074, AllV: 0.0681 +[2026-01-29T21:43:36.674325Z] Loop 895: Reg: 0.4884, AltReg: 0.7615, CorReg: 0.0788, TopReg: 0.5915, AllReg: 0.7615, BotRReg: 0.7901, OV: 0.3154, AltV: 0.0681, CorV: 0.6863, TopV: 0.2052, BotRV: 0.0066, AllV: 0.0681 +[2026-01-29T21:43:42.516611Z] Loop 900: Reg: 0.4881, AltReg: 0.7615, CorReg: 0.0780, TopReg: 0.5890, AllReg: 0.7615, BotRReg: 0.7903, OV: 0.3157, AltV: 0.0681, CorV: 0.6871, TopV: 0.2077, BotRV: 0.0064, AllV: 0.0681 +[2026-01-29T21:43:48.356381Z] Loop 905: Reg: 0.4886, AltReg: 0.7615, CorReg: 0.0792, TopReg: 0.6078, AllReg: 0.7615, BotRReg: 0.7890, OV: 0.3152, AltV: 0.0681, CorV: 0.6859, TopV: 0.1889, BotRV: 0.0077, AllV: 0.0681 +[2026-01-29T21:43:54.203306Z] Loop 910: Reg: 0.4871, AltReg: 0.7614, CorReg: 0.0755, TopReg: 0.5908, AllReg: 0.7614, BotRReg: 0.7903, OV: 0.3167, AltV: 0.0681, CorV: 0.6896, TopV: 0.2059, BotRV: 0.0064, AllV: 0.0681 +[2026-01-29T21:44:00.045541Z] Loop 915: Reg: 0.4864, AltReg: 0.7614, CorReg: 0.0739, TopReg: 0.5990, AllReg: 0.7614, BotRReg: 0.7897, OV: 0.3174, AltV: 0.0682, CorV: 0.6912, TopV: 0.1977, BotRV: 0.0069, AllV: 0.0682 +[2026-01-29T21:44:05.887331Z] Loop 920: Reg: 0.4856, AltReg: 0.7614, CorReg: 0.0720, TopReg: 0.5923, AllReg: 0.7614, BotRReg: 0.7903, OV: 0.3182, AltV: 0.0682, CorV: 0.6931, TopV: 0.2044, BotRV: 0.0064, AllV: 0.0682 +[2026-01-29T21:44:11.731949Z] Loop 925: Reg: 0.4847, AltReg: 0.7613, CorReg: 0.0697, TopReg: 0.6044, AllReg: 0.7613, BotRReg: 0.7895, OV: 0.3191, AltV: 0.0683, CorV: 0.6954, TopV: 0.1923, BotRV: 0.0072, AllV: 0.0683 +[2026-01-29T21:44:17.584906Z] Loop 930: Reg: 0.4843, AltReg: 0.7614, CorReg: 0.0687, TopReg: 0.5846, AllReg: 0.7614, BotRReg: 0.7909, OV: 0.3195, AltV: 0.0682, CorV: 0.6964, TopV: 0.2121, BotRV: 0.0058, AllV: 0.0682 +[2026-01-29T21:44:23.436100Z] Loop 935: Reg: 0.4826, AltReg: 0.7612, CorReg: 0.0647, TopReg: 0.6150, AllReg: 0.7612, BotRReg: 0.7889, OV: 0.3212, AltV: 0.0684, CorV: 0.7004, TopV: 0.1816, BotRV: 0.0077, AllV: 0.0684 +[2026-01-29T21:44:29.278807Z] Loop 940: Reg: 0.4809, AltReg: 0.7613, CorReg: 0.0605, TopReg: 0.5925, AllReg: 0.7613, BotRReg: 0.7907, OV: 0.3228, AltV: 0.0683, CorV: 0.7047, TopV: 0.2042, BotRV: 0.0060, AllV: 0.0683 +[2026-01-29T21:44:35.121929Z] Loop 945: Reg: 0.4785, AltReg: 0.7610, CorReg: 0.0548, TopReg: 0.6190, AllReg: 0.7610, BotRReg: 0.7890, OV: 0.3252, AltV: 0.0685, CorV: 0.7103, TopV: 0.1777, BotRV: 0.0077, AllV: 0.0685 +[2026-01-29T21:44:40.964363Z] Loop 950: Reg: 0.4762, AltReg: 0.7609, CorReg: 0.0491, TopReg: 0.6131, AllReg: 0.7609, BotRReg: 0.7897, OV: 0.3276, AltV: 0.0686, CorV: 0.7161, TopV: 0.1836, BotRV: 0.0070, AllV: 0.0686 +[2026-01-29T21:44:46.803241Z] Loop 955: Reg: 0.4742, AltReg: 0.7607, CorReg: 0.0444, TopReg: 0.6110, AllReg: 0.7607, BotRReg: 0.7900, OV: 0.3296, AltV: 0.0688, CorV: 0.7207, TopV: 0.1857, BotRV: 0.0067, AllV: 0.0688 +[2026-01-29T21:44:52.656174Z] Loop 960: Reg: 0.4721, AltReg: 0.7602, CorReg: 0.0399, TopReg: 0.6324, AllReg: 0.7602, BotRReg: 0.7885, OV: 0.3317, AltV: 0.0694, CorV: 0.7252, TopV: 0.1643, BotRV: 0.0082, AllV: 0.0694 +[2026-01-29T21:44:58.499070Z] Loop 965: Reg: 0.4740, AltReg: 0.7604, CorReg: 0.0445, TopReg: 0.5939, AllReg: 0.7604, BotRReg: 0.7915, OV: 0.3298, AltV: 0.0692, CorV: 0.7207, TopV: 0.2028, BotRV: 0.0052, AllV: 0.0692 +[2026-01-29T21:45:04.343029Z] Loop 970: Reg: 0.4749, AltReg: 0.7593, CorReg: 0.0483, TopReg: 0.6674, AllReg: 0.7593, BotRReg: 0.7842, OV: 0.3289, AltV: 0.0702, CorV: 0.7168, TopV: 0.1293, BotRV: 0.0125, AllV: 0.0702 +[2026-01-29T21:45:10.185273Z] Loop 975: Reg: 0.4676, AltReg: 0.7589, CorReg: 0.0308, TopReg: 0.6113, AllReg: 0.7589, BotRReg: 0.7906, OV: 0.3362, AltV: 0.0707, CorV: 0.7344, TopV: 0.1854, BotRV: 0.0061, AllV: 0.0707 +[2026-01-29T21:45:16.032308Z] Loop 980: Reg: 0.4660, AltReg: 0.7574, CorReg: 0.0288, TopReg: 0.6640, AllReg: 0.7574, BotRReg: 0.7846, OV: 0.3378, AltV: 0.0721, CorV: 0.7363, TopV: 0.1327, BotRV: 0.0121, AllV: 0.0721 +[2026-01-29T21:45:21.878718Z] Loop 985: Reg: 0.4627, AltReg: 0.7568, CorReg: 0.0215, TopReg: 0.6259, AllReg: 0.7568, BotRReg: 0.7892, OV: 0.3411, AltV: 0.0728, CorV: 0.7436, TopV: 0.1708, BotRV: 0.0075, AllV: 0.0728 +[2026-01-29T21:45:27.732092Z] Loop 990: Reg: 0.4596, AltReg: 0.7551, CorReg: 0.0163, TopReg: 0.6424, AllReg: 0.7551, BotRReg: 0.7870, OV: 0.3442, AltV: 0.0744, CorV: 0.7488, TopV: 0.1543, BotRV: 0.0097, AllV: 0.0744 +[2026-01-29T21:45:33.579748Z] Loop 995: Reg: 0.4584, AltReg: 0.7535, CorReg: 0.0157, TopReg: 0.6622, AllReg: 0.7535, BotRReg: 0.7834, OV: 0.3454, AltV: 0.0761, CorV: 0.7494, TopV: 0.1345, BotRV: 0.0133, AllV: 0.0761 +[2026-01-29T21:45:39.424226Z] Loop 1000: Reg: 0.4565, AltReg: 0.7523, CorReg: 0.0129, TopReg: 0.6369, AllReg: 0.7523, BotRReg: 0.7865, OV: 0.3472, AltV: 0.0773, CorV: 0.7522, TopV: 0.1597, BotRV: 0.0102, AllV: 0.0773 +[2026-01-29T21:45:45.270187Z] Loop 1005: Reg: 0.4560, AltReg: 0.7510, CorReg: 0.0135, TopReg: 0.6251, AllReg: 0.7510, BotRReg: 0.7871, OV: 0.3478, AltV: 0.0786, CorV: 0.7517, TopV: 0.1716, BotRV: 0.0096, AllV: 0.0786 +[2026-01-29T21:45:51.119984Z] Loop 1010: Reg: 0.4583, AltReg: 0.7494, CorReg: 0.0218, TopReg: 0.6807, AllReg: 0.7494, BotRReg: 0.7759, OV: 0.3454, AltV: 0.0802, CorV: 0.7434, TopV: 0.1160, BotRV: 0.0208, AllV: 0.0802 +[2026-01-29T21:45:56.969640Z] Loop 1015: Reg: 0.4593, AltReg: 0.7497, CorReg: 0.0237, TopReg: 0.5896, AllReg: 0.7497, BotRReg: 0.7897, OV: 0.3444, AltV: 0.0798, CorV: 0.7414, TopV: 0.2070, BotRV: 0.0069, AllV: 0.0798 +[2026-01-29T21:46:02.817357Z] Loop 1020: Reg: 0.4508, AltReg: 0.7444, CorReg: 0.0105, TopReg: 0.6702, AllReg: 0.7444, BotRReg: 0.7766, OV: 0.3529, AltV: 0.0851, CorV: 0.7547, TopV: 0.1265, BotRV: 0.0201, AllV: 0.0851 +[2026-01-29T21:46:08.661111Z] Loop 1025: Reg: 0.4494, AltReg: 0.7434, CorReg: 0.0082, TopReg: 0.6174, AllReg: 0.7434, BotRReg: 0.7847, OV: 0.3544, AltV: 0.0861, CorV: 0.7569, TopV: 0.1793, BotRV: 0.0120, AllV: 0.0861 +[2026-01-29T21:46:14.522026Z] Loop 1030: Reg: 0.4461, AltReg: 0.7395, CorReg: 0.0059, TopReg: 0.6615, AllReg: 0.7395, BotRReg: 0.7751, OV: 0.3577, AltV: 0.0900, CorV: 0.7592, TopV: 0.1352, BotRV: 0.0215, AllV: 0.0900 +[2026-01-29T21:46:20.370182Z] Loop 1035: Reg: 0.4445, AltReg: 0.7374, CorReg: 0.0052, TopReg: 0.6607, AllReg: 0.7374, BotRReg: 0.7743, OV: 0.3592, AltV: 0.0921, CorV: 0.7599, TopV: 0.1360, BotRV: 0.0224, AllV: 0.0921 +[2026-01-29T21:46:26.218069Z] Loop 1040: Reg: 0.4497, AltReg: 0.7404, CorReg: 0.0136, TopReg: 0.5831, AllReg: 0.7404, BotRReg: 0.7867, OV: 0.3541, AltV: 0.0892, CorV: 0.7515, TopV: 0.2136, BotRV: 0.0100, AllV: 0.0892 +[2026-01-29T21:46:32.066754Z] Loop 1045: Reg: 0.4504, AltReg: 0.7383, CorReg: 0.0187, TopReg: 0.6869, AllReg: 0.7383, BotRReg: 0.7656, OV: 0.3533, AltV: 0.0913, CorV: 0.7464, TopV: 0.1098, BotRV: 0.0311, AllV: 0.0913 +[2026-01-29T21:46:37.922482Z] Loop 1050: Reg: 0.4400, AltReg: 0.7316, CorReg: 0.0026, TopReg: 0.6250, AllReg: 0.7316, BotRReg: 0.7776, OV: 0.3638, AltV: 0.0979, CorV: 0.7626, TopV: 0.1717, BotRV: 0.0191, AllV: 0.0979 +[2026-01-29T21:46:43.779204Z] Loop 1055: Reg: 0.4400, AltReg: 0.7310, CorReg: 0.0034, TopReg: 0.6083, AllReg: 0.7310, BotRReg: 0.7799, OV: 0.3638, AltV: 0.0986, CorV: 0.7617, TopV: 0.1883, BotRV: 0.0168, AllV: 0.0986 +[2026-01-29T21:46:49.632814Z] Loop 1060: Reg: 0.4467, AltReg: 0.7337, CorReg: 0.0161, TopReg: 0.6883, AllReg: 0.7337, BotRReg: 0.7636, OV: 0.3571, AltV: 0.0958, CorV: 0.7490, TopV: 0.1084, BotRV: 0.0331, AllV: 0.0958 +[2026-01-29T21:46:55.478130Z] Loop 1065: Reg: 0.4359, AltReg: 0.7251, CorReg: 0.0021, TopReg: 0.6568, AllReg: 0.7251, BotRReg: 0.7689, OV: 0.3678, AltV: 0.1044, CorV: 0.7630, TopV: 0.1398, BotRV: 0.0278, AllV: 0.1044 +[2026-01-29T21:47:01.336529Z] Loop 1070: Reg: 0.4361, AltReg: 0.7254, CorReg: 0.0022, TopReg: 0.6049, AllReg: 0.7254, BotRReg: 0.7781, OV: 0.3677, AltV: 0.1042, CorV: 0.7629, TopV: 0.1918, BotRV: 0.0186, AllV: 0.1042 +[2026-01-29T21:47:07.193025Z] Loop 1075: Reg: 0.4345, AltReg: 0.7229, CorReg: 0.0018, TopReg: 0.6020, AllReg: 0.7229, BotRReg: 0.7773, OV: 0.3693, AltV: 0.1067, CorV: 0.7633, TopV: 0.1947, BotRV: 0.0193, AllV: 0.1067 +[2026-01-29T21:47:13.046407Z] Loop 1080: Reg: 0.4315, AltReg: 0.7184, CorReg: 0.0011, TopReg: 0.6495, AllReg: 0.7184, BotRReg: 0.7666, OV: 0.3723, AltV: 0.1111, CorV: 0.7640, TopV: 0.1472, BotRV: 0.0301, AllV: 0.1111 +[2026-01-29T21:47:18.903198Z] Loop 1085: Reg: 0.4372, AltReg: 0.7232, CorReg: 0.0081, TopReg: 0.6822, AllReg: 0.7232, BotRReg: 0.7612, OV: 0.3666, AltV: 0.1064, CorV: 0.7570, TopV: 0.1145, BotRV: 0.0355, AllV: 0.1064 +[2026-01-29T21:47:24.752572Z] Loop 1090: Reg: 0.4297, AltReg: 0.7154, CorReg: 0.0012, TopReg: 0.6538, AllReg: 0.7154, BotRReg: 0.7643, OV: 0.3741, AltV: 0.1141, CorV: 0.7640, TopV: 0.1429, BotRV: 0.0324, AllV: 0.1141 +[2026-01-29T21:47:30.606406Z] Loop 1095: Reg: 0.4274, AltReg: 0.7120, CorReg: 0.0004, TopReg: 0.6139, AllReg: 0.7120, BotRReg: 0.7707, OV: 0.3764, AltV: 0.1176, CorV: 0.7647, TopV: 0.1828, BotRV: 0.0260, AllV: 0.1176 +[2026-01-29T21:47:36.460157Z] Loop 1100: Reg: 0.4258, AltReg: 0.7094, CorReg: 0.0004, TopReg: 0.6148, AllReg: 0.7094, BotRReg: 0.7687, OV: 0.3780, AltV: 0.1202, CorV: 0.7648, TopV: 0.1818, BotRV: 0.0280, AllV: 0.1202 +[2026-01-29T21:47:42.300717Z] Loop 1105: Reg: 0.4286, AltReg: 0.7125, CorReg: 0.0029, TopReg: 0.6631, AllReg: 0.7125, BotRReg: 0.7606, OV: 0.3751, AltV: 0.1171, CorV: 0.7622, TopV: 0.1336, BotRV: 0.0361, AllV: 0.1171 +[2026-01-29T21:47:48.140238Z] Loop 1110: Reg: 0.4260, AltReg: 0.7090, CorReg: 0.0013, TopReg: 0.5719, AllReg: 0.7090, BotRReg: 0.7741, OV: 0.3778, AltV: 0.1205, CorV: 0.7638, TopV: 0.2248, BotRV: 0.0226, AllV: 0.1205 +[2026-01-29T21:47:53.986552Z] Loop 1115: Reg: 0.4220, AltReg: 0.7031, CorReg: 0.0003, TopReg: 0.6138, AllReg: 0.7031, BotRReg: 0.7644, OV: 0.3818, AltV: 0.1265, CorV: 0.7649, TopV: 0.1829, BotRV: 0.0323, AllV: 0.1265 +[2026-01-29T21:47:59.842461Z] Loop 1120: Reg: 0.4233, AltReg: 0.7044, CorReg: 0.0016, TopReg: 0.6460, AllReg: 0.7044, BotRReg: 0.7602, OV: 0.3805, AltV: 0.1252, CorV: 0.7635, TopV: 0.1507, BotRV: 0.0365, AllV: 0.1252 +[2026-01-29T21:48:05.690980Z] Loop 1125: Reg: 0.4219, AltReg: 0.7018, CorReg: 0.0021, TopReg: 0.6464, AllReg: 0.7018, BotRReg: 0.7599, OV: 0.3818, AltV: 0.1277, CorV: 0.7630, TopV: 0.1503, BotRV: 0.0368, AllV: 0.1277 +[2026-01-29T21:48:11.546341Z] Loop 1130: Reg: 0.4170, AltReg: 0.6948, CorReg: 0.0003, TopReg: 0.5982, AllReg: 0.6948, BotRReg: 0.7637, OV: 0.3868, AltV: 0.1347, CorV: 0.7649, TopV: 0.1985, BotRV: 0.0330, AllV: 0.1347 +[2026-01-29T21:48:17.390456Z] Loop 1135: Reg: 0.4156, AltReg: 0.6924, CorReg: 0.0004, TopReg: 0.6109, AllReg: 0.6924, BotRReg: 0.7616, OV: 0.3882, AltV: 0.1371, CorV: 0.7647, TopV: 0.1857, BotRV: 0.0351, AllV: 0.1371 +[2026-01-29T21:48:23.231270Z] Loop 1140: Reg: 0.4132, AltReg: 0.6885, CorReg: 0.0003, TopReg: 0.5694, AllReg: 0.6885, BotRReg: 0.7654, OV: 0.3906, AltV: 0.1411, CorV: 0.7648, TopV: 0.2273, BotRV: 0.0312, AllV: 0.1411 +[2026-01-29T21:48:29.077342Z] Loop 1145: Reg: 0.4118, AltReg: 0.6860, CorReg: 0.0004, TopReg: 0.5524, AllReg: 0.6860, BotRReg: 0.7665, OV: 0.3920, AltV: 0.1436, CorV: 0.7647, TopV: 0.2443, BotRV: 0.0302, AllV: 0.1436 +[2026-01-29T21:48:34.922620Z] Loop 1150: Reg: 0.4083, AltReg: 0.6801, CorReg: 0.0006, TopReg: 0.5839, AllReg: 0.6801, BotRReg: 0.7609, OV: 0.3955, AltV: 0.1494, CorV: 0.7645, TopV: 0.2128, BotRV: 0.0357, AllV: 0.1494 +[2026-01-29T21:48:40.773941Z] Loop 1155: Reg: 0.4062, AltReg: 0.6764, CorReg: 0.0008, TopReg: 0.5835, AllReg: 0.6764, BotRReg: 0.7603, OV: 0.3976, AltV: 0.1532, CorV: 0.7643, TopV: 0.2132, BotRV: 0.0364, AllV: 0.1532 +[2026-01-29T21:48:46.627201Z] Loop 1160: Reg: 0.4037, AltReg: 0.6725, CorReg: 0.0003, TopReg: 0.5448, AllReg: 0.6725, BotRReg: 0.7624, OV: 0.4001, AltV: 0.1570, CorV: 0.7648, TopV: 0.2519, BotRV: 0.0343, AllV: 0.1570 +[2026-01-29T21:48:52.472220Z] Loop 1165: Reg: 0.4009, AltReg: 0.6680, CorReg: 0.0003, TopReg: 0.5416, AllReg: 0.6680, BotRReg: 0.7617, OV: 0.4028, AltV: 0.1615, CorV: 0.7648, TopV: 0.2551, BotRV: 0.0350, AllV: 0.1615 +[2026-01-29T21:48:58.316537Z] Loop 1170: Reg: 0.4025, AltReg: 0.6685, CorReg: 0.0036, TopReg: 0.5835, AllReg: 0.6685, BotRReg: 0.7593, OV: 0.4012, AltV: 0.1610, CorV: 0.7615, TopV: 0.2132, BotRV: 0.0374, AllV: 0.1610 +[2026-01-29T21:49:04.154912Z] Loop 1175: Reg: 0.3981, AltReg: 0.6632, CorReg: 0.0005, TopReg: 0.5221, AllReg: 0.6632, BotRReg: 0.7629, OV: 0.4057, AltV: 0.1664, CorV: 0.7646, TopV: 0.2746, BotRV: 0.0338, AllV: 0.1664 +[2026-01-29T21:49:09.995357Z] Loop 1180: Reg: 0.3968, AltReg: 0.6593, CorReg: 0.0031, TopReg: 0.5612, AllReg: 0.6593, BotRReg: 0.7594, OV: 0.4070, AltV: 0.1703, CorV: 0.7620, TopV: 0.2355, BotRV: 0.0373, AllV: 0.1703 +[2026-01-29T21:49:15.836780Z] Loop 1185: Reg: 0.3897, AltReg: 0.6493, CorReg: 0.0004, TopReg: 0.5365, AllReg: 0.6493, BotRReg: 0.7603, OV: 0.4140, AltV: 0.1802, CorV: 0.7647, TopV: 0.2602, BotRV: 0.0364, AllV: 0.1802 +[2026-01-29T21:49:21.678911Z] Loop 1190: Reg: 0.4087, AltReg: 0.6782, CorReg: 0.0045, TopReg: 0.4647, AllReg: 0.6782, BotRReg: 0.7734, OV: 0.3951, AltV: 0.1514, CorV: 0.7606, TopV: 0.3320, BotRV: 0.0233, AllV: 0.1514 +[2026-01-29T21:49:27.523567Z] Loop 1195: Reg: 0.3916, AltReg: 0.6513, CorReg: 0.0020, TopReg: 0.5513, AllReg: 0.6513, BotRReg: 0.7596, OV: 0.4122, AltV: 0.1782, CorV: 0.7631, TopV: 0.2454, BotRV: 0.0371, AllV: 0.1782 +[2026-01-29T21:49:33.370759Z] Loop 1200: Reg: 0.3852, AltReg: 0.6417, CorReg: 0.0004, TopReg: 0.5316, AllReg: 0.6417, BotRReg: 0.7600, OV: 0.4186, AltV: 0.1878, CorV: 0.7647, TopV: 0.2651, BotRV: 0.0367, AllV: 0.1878 +[2026-01-29T21:49:39.212659Z] Loop 1205: Reg: 0.3816, AltReg: 0.6358, CorReg: 0.0003, TopReg: 0.4943, AllReg: 0.6358, BotRReg: 0.7614, OV: 0.4221, AltV: 0.1937, CorV: 0.7648, TopV: 0.3024, BotRV: 0.0353, AllV: 0.1937 +[2026-01-29T21:49:45.065826Z] Loop 1210: Reg: 0.3830, AltReg: 0.6380, CorReg: 0.0006, TopReg: 0.4680, AllReg: 0.6380, BotRReg: 0.7633, OV: 0.4208, AltV: 0.1916, CorV: 0.7646, TopV: 0.3287, BotRV: 0.0334, AllV: 0.1916 +[2026-01-29T21:49:50.916174Z] Loop 1215: Reg: 0.3773, AltReg: 0.6286, CorReg: 0.0003, TopReg: 0.4720, AllReg: 0.6286, BotRReg: 0.7609, OV: 0.4265, AltV: 0.2010, CorV: 0.7648, TopV: 0.3247, BotRV: 0.0358, AllV: 0.2010 +[2026-01-29T21:49:56.766334Z] Loop 1220: Reg: 0.3752, AltReg: 0.6251, CorReg: 0.0003, TopReg: 0.4692, AllReg: 0.6251, BotRReg: 0.7602, OV: 0.4286, AltV: 0.2045, CorV: 0.7648, TopV: 0.3275, BotRV: 0.0365, AllV: 0.2045 +[2026-01-29T21:50:02.614203Z] Loop 1225: Reg: 0.3816, AltReg: 0.6336, CorReg: 0.0037, TopReg: 0.5120, AllReg: 0.6336, BotRReg: 0.7591, OV: 0.4221, AltV: 0.1960, CorV: 0.7614, TopV: 0.2847, BotRV: 0.0376, AllV: 0.1960 +[2026-01-29T21:50:08.464071Z] Loop 1230: Reg: 0.3762, AltReg: 0.6267, CorReg: 0.0004, TopReg: 0.4520, AllReg: 0.6267, BotRReg: 0.7616, OV: 0.4276, AltV: 0.2029, CorV: 0.7647, TopV: 0.3446, BotRV: 0.0351, AllV: 0.2029 +[2026-01-29T21:50:14.317377Z] Loop 1235: Reg: 0.3723, AltReg: 0.6203, CorReg: 0.0002, TopReg: 0.4611, AllReg: 0.6203, BotRReg: 0.7602, OV: 0.4315, AltV: 0.2092, CorV: 0.7649, TopV: 0.3356, BotRV: 0.0365, AllV: 0.2092 +[2026-01-29T21:50:20.166100Z] Loop 1240: Reg: 0.3749, AltReg: 0.6246, CorReg: 0.0003, TopReg: 0.4932, AllReg: 0.6246, BotRReg: 0.7590, OV: 0.4289, AltV: 0.2050, CorV: 0.7648, TopV: 0.3034, BotRV: 0.0377, AllV: 0.2050 +[2026-01-29T21:50:26.013578Z] Loop 1245: Reg: 0.3708, AltReg: 0.6179, CorReg: 0.0001, TopReg: 0.4701, AllReg: 0.6179, BotRReg: 0.7595, OV: 0.4330, AltV: 0.2117, CorV: 0.7650, TopV: 0.3266, BotRV: 0.0372, AllV: 0.2117 +[2026-01-29T21:50:31.855264Z] Loop 1250: Reg: 0.3709, AltReg: 0.6182, CorReg: 0.0001, TopReg: 0.4555, AllReg: 0.6182, BotRReg: 0.7607, OV: 0.4328, AltV: 0.2114, CorV: 0.7650, TopV: 0.3412, BotRV: 0.0360, AllV: 0.2114 +[2026-01-29T21:50:37.702581Z] Loop 1255: Reg: 0.3698, AltReg: 0.6162, CorReg: 0.0001, TopReg: 0.4672, AllReg: 0.6162, BotRReg: 0.7596, OV: 0.4340, AltV: 0.2133, CorV: 0.7650, TopV: 0.3295, BotRV: 0.0371, AllV: 0.2133 +[2026-01-29T21:50:43.549129Z] Loop 1260: Reg: 0.3695, AltReg: 0.6158, CorReg: 0.0001, TopReg: 0.4657, AllReg: 0.6158, BotRReg: 0.7596, OV: 0.4343, AltV: 0.2138, CorV: 0.7650, TopV: 0.3309, BotRV: 0.0371, AllV: 0.2138 +[2026-01-29T21:50:49.395097Z] Loop 1265: Reg: 0.3696, AltReg: 0.6159, CorReg: 0.0001, TopReg: 0.4457, AllReg: 0.6159, BotRReg: 0.7611, OV: 0.4342, AltV: 0.2137, CorV: 0.7650, TopV: 0.3510, BotRV: 0.0355, AllV: 0.2137 +[2026-01-29T21:50:55.239908Z] Loop 1270: Reg: 0.3760, AltReg: 0.6264, CorReg: 0.0005, TopReg: 0.4295, AllReg: 0.6264, BotRReg: 0.7659, OV: 0.4277, AltV: 0.2032, CorV: 0.7646, TopV: 0.3672, BotRV: 0.0308, AllV: 0.2032 +[2026-01-29T21:51:01.085125Z] Loop 1275: Reg: 0.3680, AltReg: 0.6134, CorReg: 0.0001, TopReg: 0.4520, AllReg: 0.6134, BotRReg: 0.7598, OV: 0.4357, AltV: 0.2162, CorV: 0.7650, TopV: 0.3447, BotRV: 0.0369, AllV: 0.2162 +[2026-01-29T21:51:06.930097Z] Loop 1280: Reg: 0.3772, AltReg: 0.6269, CorReg: 0.0027, TopReg: 0.5134, AllReg: 0.6269, BotRReg: 0.7588, OV: 0.4265, AltV: 0.2026, CorV: 0.7624, TopV: 0.2833, BotRV: 0.0379, AllV: 0.2026 +[2026-01-29T21:51:12.780280Z] Loop 1285: Reg: 0.3673, AltReg: 0.6121, CorReg: 0.0001, TopReg: 0.4448, AllReg: 0.6121, BotRReg: 0.7599, OV: 0.4365, AltV: 0.2174, CorV: 0.7651, TopV: 0.3519, BotRV: 0.0368, AllV: 0.2174 +[2026-01-29T21:51:18.651390Z] Loop 1290: Reg: 0.3819, AltReg: 0.6359, CorReg: 0.0010, TopReg: 0.4221, AllReg: 0.6359, BotRReg: 0.7697, OV: 0.4218, AltV: 0.1936, CorV: 0.7641, TopV: 0.3746, BotRV: 0.0270, AllV: 0.1936 +[2026-01-29T21:51:24.509607Z] Loop 1295: Reg: 0.3738, AltReg: 0.6224, CorReg: 0.0010, TopReg: 0.5010, AllReg: 0.6224, BotRReg: 0.7588, OV: 0.4300, AltV: 0.2072, CorV: 0.7641, TopV: 0.2956, BotRV: 0.0379, AllV: 0.2072 +[2026-01-29T21:51:30.360157Z] Loop 1300: Reg: 0.3746, AltReg: 0.6241, CorReg: 0.0005, TopReg: 0.5124, AllReg: 0.6241, BotRReg: 0.7588, OV: 0.4291, AltV: 0.2055, CorV: 0.7646, TopV: 0.2842, BotRV: 0.0379, AllV: 0.2055 +[2026-01-29T21:51:36.221334Z] Loop 1305: Reg: 0.3673, AltReg: 0.6122, CorReg: 0.0000, TopReg: 0.4610, AllReg: 0.6122, BotRReg: 0.7596, OV: 0.4364, AltV: 0.2174, CorV: 0.7651, TopV: 0.3357, BotRV: 0.0371, AllV: 0.2174 +[2026-01-29T21:51:42.073673Z] Loop 1310: Reg: 0.3724, AltReg: 0.6205, CorReg: 0.0002, TopReg: 0.4271, AllReg: 0.6205, BotRReg: 0.7685, OV: 0.4314, AltV: 0.2090, CorV: 0.7649, TopV: 0.3696, BotRV: 0.0282, AllV: 0.2090 +[2026-01-29T21:51:47.934665Z] Loop 1315: Reg: 0.3672, AltReg: 0.6119, CorReg: 0.0001, TopReg: 0.4307, AllReg: 0.6119, BotRReg: 0.7631, OV: 0.4366, AltV: 0.2176, CorV: 0.7650, TopV: 0.3660, BotRV: 0.0336, AllV: 0.2176 +[2026-01-29T21:51:53.786264Z] Loop 1320: Reg: 0.3656, AltReg: 0.6093, CorReg: 0.0000, TopReg: 0.4373, AllReg: 0.6093, BotRReg: 0.7603, OV: 0.4382, AltV: 0.2202, CorV: 0.7651, TopV: 0.3594, BotRV: 0.0364, AllV: 0.2202 +[2026-01-29T21:51:59.639011Z] Loop 1325: Reg: 0.3675, AltReg: 0.6124, CorReg: 0.0001, TopReg: 0.4657, AllReg: 0.6124, BotRReg: 0.7590, OV: 0.4363, AltV: 0.2171, CorV: 0.7651, TopV: 0.3310, BotRV: 0.0377, AllV: 0.2171 +[2026-01-29T21:52:05.494991Z] Loop 1330: Reg: 0.3667, AltReg: 0.6112, CorReg: 0.0000, TopReg: 0.4586, AllReg: 0.6112, BotRReg: 0.7590, OV: 0.4370, AltV: 0.2184, CorV: 0.7651, TopV: 0.3381, BotRV: 0.0377, AllV: 0.2184 +[2026-01-29T21:52:11.353666Z] Loop 1335: Reg: 0.3654, AltReg: 0.6089, CorReg: 0.0000, TopReg: 0.4448, AllReg: 0.6089, BotRReg: 0.7592, OV: 0.4384, AltV: 0.2206, CorV: 0.7651, TopV: 0.3519, BotRV: 0.0375, AllV: 0.2206 +[2026-01-29T21:52:17.207313Z] Loop 1340: Reg: 0.3647, AltReg: 0.6078, CorReg: 0.0000, TopReg: 0.4389, AllReg: 0.6078, BotRReg: 0.7594, OV: 0.4391, AltV: 0.2218, CorV: 0.7651, TopV: 0.3578, BotRV: 0.0373, AllV: 0.2218 +[2026-01-29T21:52:23.070732Z] Loop 1345: Reg: 0.3675, AltReg: 0.6123, CorReg: 0.0002, TopReg: 0.4129, AllReg: 0.6123, BotRReg: 0.7634, OV: 0.4363, AltV: 0.2173, CorV: 0.7649, TopV: 0.3838, BotRV: 0.0333, AllV: 0.2173 +[2026-01-29T21:52:28.937730Z] Loop 1350: Reg: 0.3646, AltReg: 0.6077, CorReg: 0.0001, TopReg: 0.4226, AllReg: 0.6077, BotRReg: 0.7608, OV: 0.4391, AltV: 0.2219, CorV: 0.7651, TopV: 0.3741, BotRV: 0.0359, AllV: 0.2219 +[2026-01-29T21:52:34.788293Z] Loop 1355: Reg: 0.3649, AltReg: 0.6080, CorReg: 0.0001, TopReg: 0.4449, AllReg: 0.6080, BotRReg: 0.7590, OV: 0.4389, AltV: 0.2215, CorV: 0.7650, TopV: 0.3518, BotRV: 0.0377, AllV: 0.2215 +[2026-01-29T21:52:40.652430Z] Loop 1360: Reg: 0.3733, AltReg: 0.6208, CorReg: 0.0019, TopReg: 0.5071, AllReg: 0.6208, BotRReg: 0.7588, OV: 0.4305, AltV: 0.2087, CorV: 0.7632, TopV: 0.2896, BotRV: 0.0379, AllV: 0.2087 +[2026-01-29T21:52:46.506251Z] Loop 1365: Reg: 0.3644, AltReg: 0.6074, CorReg: 0.0001, TopReg: 0.4447, AllReg: 0.6074, BotRReg: 0.7591, OV: 0.4393, AltV: 0.2222, CorV: 0.7651, TopV: 0.3520, BotRV: 0.0376, AllV: 0.2222 +[2026-01-29T21:52:52.370676Z] Loop 1370: Reg: 0.3632, AltReg: 0.6053, CorReg: 0.0000, TopReg: 0.4257, AllReg: 0.6053, BotRReg: 0.7604, OV: 0.4406, AltV: 0.2243, CorV: 0.7651, TopV: 0.3710, BotRV: 0.0363, AllV: 0.2243 +[2026-01-29T21:52:58.217320Z] Loop 1375: Reg: 0.3639, AltReg: 0.6065, CorReg: 0.0001, TopReg: 0.4144, AllReg: 0.6065, BotRReg: 0.7622, OV: 0.4398, AltV: 0.2230, CorV: 0.7651, TopV: 0.3823, BotRV: 0.0345, AllV: 0.2230 +[2026-01-29T21:53:04.059518Z] Loop 1380: Reg: 0.3632, AltReg: 0.6052, CorReg: 0.0000, TopReg: 0.4349, AllReg: 0.6052, BotRReg: 0.7595, OV: 0.4406, AltV: 0.2243, CorV: 0.7651, TopV: 0.3617, BotRV: 0.0372, AllV: 0.2243 +[2026-01-29T21:53:09.910272Z] Loop 1385: Reg: 0.3644, AltReg: 0.6073, CorReg: 0.0000, TopReg: 0.4463, AllReg: 0.6073, BotRReg: 0.7590, OV: 0.4394, AltV: 0.2223, CorV: 0.7651, TopV: 0.3504, BotRV: 0.0377, AllV: 0.2223 +[2026-01-29T21:53:15.772266Z] Loop 1390: Reg: 0.3628, AltReg: 0.6046, CorReg: 0.0000, TopReg: 0.4274, AllReg: 0.6046, BotRReg: 0.7605, OV: 0.4410, AltV: 0.2249, CorV: 0.7651, TopV: 0.3693, BotRV: 0.0362, AllV: 0.2249 +[2026-01-29T21:53:21.636456Z] Loop 1395: Reg: 0.3627, AltReg: 0.6045, CorReg: 0.0000, TopReg: 0.4325, AllReg: 0.6045, BotRReg: 0.7597, OV: 0.4411, AltV: 0.2250, CorV: 0.7651, TopV: 0.3642, BotRV: 0.0370, AllV: 0.2250 +[2026-01-29T21:53:27.484363Z] Loop 1400: Reg: 0.3642, AltReg: 0.6070, CorReg: 0.0000, TopReg: 0.4480, AllReg: 0.6070, BotRReg: 0.7590, OV: 0.4396, AltV: 0.2226, CorV: 0.7651, TopV: 0.3487, BotRV: 0.0377, AllV: 0.2226 +[2026-01-29T21:53:33.330022Z] Loop 1405: Reg: 0.3664, AltReg: 0.6105, CorReg: 0.0001, TopReg: 0.4677, AllReg: 0.6105, BotRReg: 0.7588, OV: 0.4374, AltV: 0.2190, CorV: 0.7650, TopV: 0.3290, BotRV: 0.0379, AllV: 0.2190 +[2026-01-29T21:53:39.179966Z] Loop 1410: Reg: 0.3656, AltReg: 0.6093, CorReg: 0.0001, TopReg: 0.4639, AllReg: 0.6093, BotRReg: 0.7588, OV: 0.4382, AltV: 0.2203, CorV: 0.7650, TopV: 0.3328, BotRV: 0.0379, AllV: 0.2203 +[2026-01-29T21:53:45.032659Z] Loop 1415: Reg: 0.3620, AltReg: 0.6034, CorReg: 0.0000, TopReg: 0.4327, AllReg: 0.6034, BotRReg: 0.7592, OV: 0.4417, AltV: 0.2262, CorV: 0.7651, TopV: 0.3640, BotRV: 0.0375, AllV: 0.2262 +[2026-01-29T21:53:50.880531Z] Loop 1420: Reg: 0.3611, AltReg: 0.6019, CorReg: 0.0000, TopReg: 0.4200, AllReg: 0.6019, BotRReg: 0.7596, OV: 0.4426, AltV: 0.2277, CorV: 0.7651, TopV: 0.3767, BotRV: 0.0370, AllV: 0.2277 +[2026-01-29T21:53:56.731413Z] Loop 1425: Reg: 0.3617, AltReg: 0.6028, CorReg: 0.0000, TopReg: 0.4059, AllReg: 0.6028, BotRReg: 0.7613, OV: 0.4421, AltV: 0.2268, CorV: 0.7651, TopV: 0.3908, BotRV: 0.0354, AllV: 0.2268 +[2026-01-29T21:54:02.577978Z] Loop 1430: Reg: 0.3608, AltReg: 0.6013, CorReg: 0.0000, TopReg: 0.4109, AllReg: 0.6013, BotRReg: 0.7601, OV: 0.4430, AltV: 0.2283, CorV: 0.7651, TopV: 0.3858, BotRV: 0.0366, AllV: 0.2283 +[2026-01-29T21:54:08.421015Z] Loop 1435: Reg: 0.3606, AltReg: 0.6010, CorReg: 0.0000, TopReg: 0.4124, AllReg: 0.6010, BotRReg: 0.7598, OV: 0.4432, AltV: 0.2286, CorV: 0.7651, TopV: 0.3843, BotRV: 0.0369, AllV: 0.2286 +[2026-01-29T21:54:14.266549Z] Loop 1440: Reg: 0.3606, AltReg: 0.6009, CorReg: 0.0000, TopReg: 0.4085, AllReg: 0.6009, BotRReg: 0.7601, OV: 0.4432, AltV: 0.2286, CorV: 0.7651, TopV: 0.3882, BotRV: 0.0366, AllV: 0.2286 +[2026-01-29T21:54:20.115205Z] Loop 1445: Reg: 0.3603, AltReg: 0.6005, CorReg: 0.0000, TopReg: 0.4107, AllReg: 0.6005, BotRReg: 0.7597, OV: 0.4435, AltV: 0.2291, CorV: 0.7651, TopV: 0.3860, BotRV: 0.0370, AllV: 0.2291 +[2026-01-29T21:54:25.958762Z] Loop 1450: Reg: 0.3620, AltReg: 0.6033, CorReg: 0.0001, TopReg: 0.4373, AllReg: 0.6033, BotRReg: 0.7589, OV: 0.4418, AltV: 0.2263, CorV: 0.7650, TopV: 0.3594, BotRV: 0.0378, AllV: 0.2263 +[2026-01-29T21:54:31.807262Z] Loop 1455: Reg: 0.3600, AltReg: 0.6000, CorReg: 0.0000, TopReg: 0.4111, AllReg: 0.6000, BotRReg: 0.7597, OV: 0.4438, AltV: 0.2295, CorV: 0.7651, TopV: 0.3856, BotRV: 0.0370, AllV: 0.2295 +[2026-01-29T21:54:37.652458Z] Loop 1460: Reg: 0.3603, AltReg: 0.6005, CorReg: 0.0000, TopReg: 0.4058, AllReg: 0.6005, BotRReg: 0.7608, OV: 0.4435, AltV: 0.2291, CorV: 0.7651, TopV: 0.3909, BotRV: 0.0359, AllV: 0.2291 +[2026-01-29T21:54:43.492657Z] Loop 1465: Reg: 0.3598, AltReg: 0.5997, CorReg: 0.0000, TopReg: 0.4076, AllReg: 0.5997, BotRReg: 0.7599, OV: 0.4440, AltV: 0.2299, CorV: 0.7651, TopV: 0.3891, BotRV: 0.0368, AllV: 0.2299 +[2026-01-29T21:54:49.339335Z] Loop 1470: Reg: 0.3623, AltReg: 0.6038, CorReg: 0.0001, TopReg: 0.4024, AllReg: 0.6038, BotRReg: 0.7629, OV: 0.4415, AltV: 0.2258, CorV: 0.7650, TopV: 0.3943, BotRV: 0.0338, AllV: 0.2258 +[2026-01-29T21:54:55.183879Z] Loop 1475: Reg: 0.3595, AltReg: 0.5991, CorReg: 0.0000, TopReg: 0.4073, AllReg: 0.5991, BotRReg: 0.7597, OV: 0.4443, AltV: 0.2304, CorV: 0.7651, TopV: 0.3894, BotRV: 0.0369, AllV: 0.2304 +[2026-01-29T21:55:01.028553Z] Loop 1480: Reg: 0.3630, AltReg: 0.6047, CorReg: 0.0005, TopReg: 0.4474, AllReg: 0.6047, BotRReg: 0.7589, OV: 0.4407, AltV: 0.2248, CorV: 0.7647, TopV: 0.3493, BotRV: 0.0378, AllV: 0.2248 +[2026-01-29T21:55:06.876325Z] Loop 1485: Reg: 0.3620, AltReg: 0.6031, CorReg: 0.0003, TopReg: 0.4381, AllReg: 0.6031, BotRReg: 0.7590, OV: 0.4418, AltV: 0.2265, CorV: 0.7648, TopV: 0.3586, BotRV: 0.0377, AllV: 0.2265 +[2026-01-29T21:55:12.725659Z] Loop 1490: Reg: 0.3610, AltReg: 0.6016, CorReg: 0.0001, TopReg: 0.4027, AllReg: 0.6016, BotRReg: 0.7622, OV: 0.4428, AltV: 0.2280, CorV: 0.7650, TopV: 0.3940, BotRV: 0.0345, AllV: 0.2280 +[2026-01-29T21:55:18.568588Z] Loop 1495: Reg: 0.3667, AltReg: 0.6104, CorReg: 0.0010, TopReg: 0.3925, AllReg: 0.6104, BotRReg: 0.7665, OV: 0.4371, AltV: 0.2191, CorV: 0.7641, TopV: 0.4042, BotRV: 0.0302, AllV: 0.2191 +[2026-01-29T21:55:24.411774Z] Loop 1500: Reg: 0.3604, AltReg: 0.6006, CorReg: 0.0001, TopReg: 0.4023, AllReg: 0.6006, BotRReg: 0.7621, OV: 0.4434, AltV: 0.2290, CorV: 0.7651, TopV: 0.3944, BotRV: 0.0345, AllV: 0.2290 +[2026-01-29T21:55:30.254787Z] Loop 1505: Reg: 0.3600, AltReg: 0.6000, CorReg: 0.0000, TopReg: 0.4226, AllReg: 0.6000, BotRReg: 0.7589, OV: 0.4438, AltV: 0.2295, CorV: 0.7651, TopV: 0.3741, BotRV: 0.0378, AllV: 0.2295 +[2026-01-29T21:55:36.100036Z] Loop 1510: Reg: 0.3633, AltReg: 0.6055, CorReg: 0.0001, TopReg: 0.4569, AllReg: 0.6055, BotRReg: 0.7587, OV: 0.4405, AltV: 0.2241, CorV: 0.7650, TopV: 0.3398, BotRV: 0.0380, AllV: 0.2241 +[2026-01-29T21:55:41.943057Z] Loop 1515: Reg: 0.3619, AltReg: 0.6031, CorReg: 0.0000, TopReg: 0.4432, AllReg: 0.6031, BotRReg: 0.7587, OV: 0.4419, AltV: 0.2264, CorV: 0.7651, TopV: 0.3535, BotRV: 0.0379, AllV: 0.2264 +[2026-01-29T21:55:47.789671Z] Loop 1520: Reg: 0.3587, AltReg: 0.5979, CorReg: 0.0000, TopReg: 0.4070, AllReg: 0.5979, BotRReg: 0.7595, OV: 0.4451, AltV: 0.2317, CorV: 0.7651, TopV: 0.3897, BotRV: 0.0372, AllV: 0.2317 +[2026-01-29T21:55:53.640034Z] Loop 1525: Reg: 0.3600, AltReg: 0.6000, CorReg: 0.0000, TopReg: 0.4021, AllReg: 0.6000, BotRReg: 0.7627, OV: 0.4437, AltV: 0.2295, CorV: 0.7651, TopV: 0.3946, BotRV: 0.0340, AllV: 0.2295 +[2026-01-29T21:55:59.484157Z] Loop 1530: Reg: 0.3587, AltReg: 0.5978, CorReg: 0.0000, TopReg: 0.4034, AllReg: 0.5978, BotRReg: 0.7606, OV: 0.4451, AltV: 0.2318, CorV: 0.7651, TopV: 0.3933, BotRV: 0.0361, AllV: 0.2318 +[2026-01-29T21:56:05.327472Z] Loop 1535: Reg: 0.3587, AltReg: 0.5979, CorReg: 0.0000, TopReg: 0.4104, AllReg: 0.5979, BotRReg: 0.7590, OV: 0.4450, AltV: 0.2317, CorV: 0.7651, TopV: 0.3863, BotRV: 0.0377, AllV: 0.2317 +[2026-01-29T21:56:11.169912Z] Loop 1540: Reg: 0.3625, AltReg: 0.6040, CorReg: 0.0001, TopReg: 0.4499, AllReg: 0.6040, BotRReg: 0.7587, OV: 0.4413, AltV: 0.2255, CorV: 0.7650, TopV: 0.3468, BotRV: 0.0380, AllV: 0.2255 +[2026-01-29T21:56:17.011325Z] Loop 1545: Reg: 0.3666, AltReg: 0.6105, CorReg: 0.0007, TopReg: 0.4937, AllReg: 0.6105, BotRReg: 0.7587, OV: 0.4372, AltV: 0.2190, CorV: 0.7644, TopV: 0.3030, BotRV: 0.0380, AllV: 0.2190 +[2026-01-29T21:56:22.852505Z] Loop 1550: Reg: 0.3603, AltReg: 0.6004, CorReg: 0.0001, TopReg: 0.4298, AllReg: 0.6004, BotRReg: 0.7588, OV: 0.4435, AltV: 0.2292, CorV: 0.7650, TopV: 0.3669, BotRV: 0.0379, AllV: 0.2292 +[2026-01-29T21:56:28.701481Z] Loop 1555: Reg: 0.3581, AltReg: 0.5967, CorReg: 0.0000, TopReg: 0.4034, AllReg: 0.5967, BotRReg: 0.7603, OV: 0.4457, AltV: 0.2328, CorV: 0.7651, TopV: 0.3933, BotRV: 0.0364, AllV: 0.2328 +[2026-01-29T21:56:34.550071Z] Loop 1560: Reg: 0.3617, AltReg: 0.6027, CorReg: 0.0002, TopReg: 0.3920, AllReg: 0.6027, BotRReg: 0.7633, OV: 0.4421, AltV: 0.2269, CorV: 0.7650, TopV: 0.4047, BotRV: 0.0334, AllV: 0.2269 +[2026-01-29T21:56:40.398552Z] Loop 1565: Reg: 0.3592, AltReg: 0.5987, CorReg: 0.0001, TopReg: 0.3989, AllReg: 0.5987, BotRReg: 0.7616, OV: 0.4445, AltV: 0.2309, CorV: 0.7651, TopV: 0.3978, BotRV: 0.0351, AllV: 0.2309 +[2026-01-29T21:56:46.254840Z] Loop 1570: Reg: 0.3579, AltReg: 0.5966, CorReg: 0.0000, TopReg: 0.4095, AllReg: 0.5966, BotRReg: 0.7591, OV: 0.4458, AltV: 0.2330, CorV: 0.7651, TopV: 0.3872, BotRV: 0.0376, AllV: 0.2330 +[2026-01-29T21:56:52.100644Z] Loop 1575: Reg: 0.3592, AltReg: 0.5987, CorReg: 0.0001, TopReg: 0.4218, AllReg: 0.5987, BotRReg: 0.7588, OV: 0.4445, AltV: 0.2309, CorV: 0.7650, TopV: 0.3749, BotRV: 0.0379, AllV: 0.2309 +[2026-01-29T21:56:57.965584Z] Loop 1580: Reg: 0.3577, AltReg: 0.5961, CorReg: 0.0000, TopReg: 0.4064, AllReg: 0.5961, BotRReg: 0.7593, OV: 0.4461, AltV: 0.2335, CorV: 0.7651, TopV: 0.3903, BotRV: 0.0374, AllV: 0.2335 +[2026-01-29T21:57:03.819327Z] Loop 1585: Reg: 0.3575, AltReg: 0.5958, CorReg: 0.0000, TopReg: 0.4048, AllReg: 0.5958, BotRReg: 0.7595, OV: 0.4463, AltV: 0.2337, CorV: 0.7651, TopV: 0.3919, BotRV: 0.0372, AllV: 0.2337 +[2026-01-29T21:57:09.674607Z] Loop 1590: Reg: 0.3575, AltReg: 0.5958, CorReg: 0.0000, TopReg: 0.4024, AllReg: 0.5958, BotRReg: 0.7602, OV: 0.4463, AltV: 0.2337, CorV: 0.7651, TopV: 0.3943, BotRV: 0.0364, AllV: 0.2337 +[2026-01-29T21:57:15.519868Z] Loop 1595: Reg: 0.3573, AltReg: 0.5956, CorReg: 0.0000, TopReg: 0.4027, AllReg: 0.5956, BotRReg: 0.7599, OV: 0.4464, AltV: 0.2340, CorV: 0.7651, TopV: 0.3939, BotRV: 0.0367, AllV: 0.2340 +[2026-01-29T21:57:21.374359Z] Loop 1600: Reg: 0.3573, AltReg: 0.5955, CorReg: 0.0000, TopReg: 0.4022, AllReg: 0.5955, BotRReg: 0.7602, OV: 0.4465, AltV: 0.2340, CorV: 0.7651, TopV: 0.3945, BotRV: 0.0365, AllV: 0.2340 +[2026-01-29T21:57:27.217025Z] Loop 1605: Reg: 0.3603, AltReg: 0.6005, CorReg: 0.0000, TopReg: 0.3944, AllReg: 0.6005, BotRReg: 0.7641, OV: 0.4435, AltV: 0.2291, CorV: 0.7651, TopV: 0.4023, BotRV: 0.0326, AllV: 0.2291 +[2026-01-29T21:57:33.064319Z] Loop 1610: Reg: 0.3592, AltReg: 0.5986, CorReg: 0.0000, TopReg: 0.3982, AllReg: 0.5986, BotRReg: 0.7635, OV: 0.4446, AltV: 0.2309, CorV: 0.7651, TopV: 0.3985, BotRV: 0.0331, AllV: 0.2309 +[2026-01-29T21:57:38.908083Z] Loop 1615: Reg: 0.3583, AltReg: 0.5972, CorReg: 0.0000, TopReg: 0.4110, AllReg: 0.5972, BotRReg: 0.7589, OV: 0.4455, AltV: 0.2323, CorV: 0.7651, TopV: 0.3857, BotRV: 0.0378, AllV: 0.2323 +[2026-01-29T21:57:44.756512Z] Loop 1620: Reg: 0.3602, AltReg: 0.6003, CorReg: 0.0000, TopReg: 0.4302, AllReg: 0.6003, BotRReg: 0.7587, OV: 0.4436, AltV: 0.2293, CorV: 0.7651, TopV: 0.3664, BotRV: 0.0380, AllV: 0.2293 +[2026-01-29T21:57:50.599853Z] Loop 1625: Reg: 0.3593, AltReg: 0.5989, CorReg: 0.0000, TopReg: 0.4212, AllReg: 0.5989, BotRReg: 0.7588, OV: 0.4445, AltV: 0.2307, CorV: 0.7651, TopV: 0.3754, BotRV: 0.0379, AllV: 0.2307 +[2026-01-29T21:57:56.444540Z] Loop 1630: Reg: 0.3582, AltReg: 0.5970, CorReg: 0.0000, TopReg: 0.4105, AllReg: 0.5970, BotRReg: 0.7589, OV: 0.4456, AltV: 0.2326, CorV: 0.7651, TopV: 0.3862, BotRV: 0.0378, AllV: 0.2326 +[2026-01-29T21:58:02.292961Z] Loop 1635: Reg: 0.3576, AltReg: 0.5960, CorReg: 0.0000, TopReg: 0.4065, AllReg: 0.5960, BotRReg: 0.7590, OV: 0.4462, AltV: 0.2336, CorV: 0.7651, TopV: 0.3901, BotRV: 0.0377, AllV: 0.2336 +[2026-01-29T21:58:08.136295Z] Loop 1640: Reg: 0.3568, AltReg: 0.5946, CorReg: 0.0000, TopReg: 0.4008, AllReg: 0.5946, BotRReg: 0.7602, OV: 0.4470, AltV: 0.2349, CorV: 0.7651, TopV: 0.3959, BotRV: 0.0365, AllV: 0.2349 +[2026-01-29T21:58:13.981486Z] Loop 1645: Reg: 0.3568, AltReg: 0.5946, CorReg: 0.0000, TopReg: 0.3993, AllReg: 0.5946, BotRReg: 0.7609, OV: 0.4470, AltV: 0.2349, CorV: 0.7651, TopV: 0.3974, BotRV: 0.0358, AllV: 0.2349 +[2026-01-29T21:58:19.837432Z] Loop 1650: Reg: 0.3568, AltReg: 0.5946, CorReg: 0.0000, TopReg: 0.4038, AllReg: 0.5946, BotRReg: 0.7594, OV: 0.4470, AltV: 0.2349, CorV: 0.7651, TopV: 0.3929, BotRV: 0.0373, AllV: 0.2349 +[2026-01-29T21:58:25.686959Z] Loop 1655: Reg: 0.3619, AltReg: 0.6031, CorReg: 0.0002, TopReg: 0.4543, AllReg: 0.6031, BotRReg: 0.7587, OV: 0.4418, AltV: 0.2265, CorV: 0.7649, TopV: 0.3424, BotRV: 0.0380, AllV: 0.2265 +[2026-01-29T21:58:31.541684Z] Loop 1660: Reg: 0.3574, AltReg: 0.5957, CorReg: 0.0000, TopReg: 0.4107, AllReg: 0.5957, BotRReg: 0.7589, OV: 0.4463, AltV: 0.2338, CorV: 0.7651, TopV: 0.3860, BotRV: 0.0378, AllV: 0.2338 +[2026-01-29T21:58:37.391034Z] Loop 1665: Reg: 0.3563, AltReg: 0.5938, CorReg: 0.0000, TopReg: 0.3914, AllReg: 0.5938, BotRReg: 0.7613, OV: 0.4475, AltV: 0.2358, CorV: 0.7651, TopV: 0.4053, BotRV: 0.0354, AllV: 0.2358 +[2026-01-29T21:58:43.235739Z] Loop 1670: Reg: 0.3564, AltReg: 0.5940, CorReg: 0.0000, TopReg: 0.3906, AllReg: 0.5940, BotRReg: 0.7618, OV: 0.4474, AltV: 0.2356, CorV: 0.7651, TopV: 0.4061, BotRV: 0.0349, AllV: 0.2356 +[2026-01-29T21:58:49.081215Z] Loop 1675: Reg: 0.3564, AltReg: 0.5940, CorReg: 0.0000, TopReg: 0.3929, AllReg: 0.5940, BotRReg: 0.7616, OV: 0.4474, AltV: 0.2356, CorV: 0.7651, TopV: 0.4038, BotRV: 0.0351, AllV: 0.2356 +[2026-01-29T21:58:54.923920Z] Loop 1680: Reg: 0.3565, AltReg: 0.5941, CorReg: 0.0000, TopReg: 0.3903, AllReg: 0.5941, BotRReg: 0.7621, OV: 0.4473, AltV: 0.2354, CorV: 0.7651, TopV: 0.4064, BotRV: 0.0346, AllV: 0.2354 +[2026-01-29T21:59:00.771163Z] Loop 1685: Reg: 0.3568, AltReg: 0.5947, CorReg: 0.0001, TopReg: 0.3872, AllReg: 0.5947, BotRReg: 0.7627, OV: 0.4470, AltV: 0.2349, CorV: 0.7651, TopV: 0.4095, BotRV: 0.0340, AllV: 0.2349 +[2026-01-29T21:59:06.623072Z] Loop 1690: Reg: 0.3639, AltReg: 0.6056, CorReg: 0.0013, TopReg: 0.3786, AllReg: 0.6056, BotRReg: 0.7672, OV: 0.4399, AltV: 0.2239, CorV: 0.7638, TopV: 0.4181, BotRV: 0.0295, AllV: 0.2239 +[2026-01-29T21:59:12.476710Z] Loop 1695: Reg: 0.3560, AltReg: 0.5933, CorReg: 0.0000, TopReg: 0.3884, AllReg: 0.5933, BotRReg: 0.7614, OV: 0.4478, AltV: 0.2363, CorV: 0.7651, TopV: 0.4083, BotRV: 0.0353, AllV: 0.2363 +[2026-01-29T21:59:18.325912Z] Loop 1700: Reg: 0.3562, AltReg: 0.5937, CorReg: 0.0000, TopReg: 0.4016, AllReg: 0.5937, BotRReg: 0.7590, OV: 0.4476, AltV: 0.2359, CorV: 0.7651, TopV: 0.3951, BotRV: 0.0376, AllV: 0.2359 +[2026-01-29T21:59:24.175108Z] Loop 1705: Reg: 0.3571, AltReg: 0.5951, CorReg: 0.0000, TopReg: 0.4080, AllReg: 0.5951, BotRReg: 0.7588, OV: 0.4467, AltV: 0.2344, CorV: 0.7651, TopV: 0.3887, BotRV: 0.0379, AllV: 0.2344 +[2026-01-29T21:59:30.021731Z] Loop 1710: Reg: 0.3578, AltReg: 0.5964, CorReg: 0.0000, TopReg: 0.4140, AllReg: 0.5964, BotRReg: 0.7587, OV: 0.4459, AltV: 0.2332, CorV: 0.7651, TopV: 0.3827, BotRV: 0.0380, AllV: 0.2332 +[2026-01-29T21:59:35.865703Z] Loop 1715: Reg: 0.3572, AltReg: 0.5953, CorReg: 0.0000, TopReg: 0.4104, AllReg: 0.5953, BotRReg: 0.7588, OV: 0.4466, AltV: 0.2342, CorV: 0.7651, TopV: 0.3863, BotRV: 0.0379, AllV: 0.2342 +[2026-01-29T21:59:41.721662Z] Loop 1720: Reg: 0.3562, AltReg: 0.5936, CorReg: 0.0000, TopReg: 0.4034, AllReg: 0.5936, BotRReg: 0.7590, OV: 0.4476, AltV: 0.2359, CorV: 0.7651, TopV: 0.3933, BotRV: 0.0377, AllV: 0.2359 +[2026-01-29T21:59:47.579147Z] Loop 1725: Reg: 0.3568, AltReg: 0.5946, CorReg: 0.0000, TopReg: 0.4092, AllReg: 0.5946, BotRReg: 0.7589, OV: 0.4470, AltV: 0.2349, CorV: 0.7651, TopV: 0.3875, BotRV: 0.0378, AllV: 0.2349 +[2026-01-29T21:59:53.425912Z] Loop 1730: Reg: 0.3558, AltReg: 0.5929, CorReg: 0.0000, TopReg: 0.4022, AllReg: 0.5929, BotRReg: 0.7591, OV: 0.4480, AltV: 0.2366, CorV: 0.7651, TopV: 0.3945, BotRV: 0.0375, AllV: 0.2366 +[2026-01-29T21:59:59.268954Z] Loop 1735: Reg: 0.3552, AltReg: 0.5919, CorReg: 0.0000, TopReg: 0.3982, AllReg: 0.5919, BotRReg: 0.7594, OV: 0.4486, AltV: 0.2376, CorV: 0.7651, TopV: 0.3985, BotRV: 0.0373, AllV: 0.2376 +[2026-01-29T22:00:05.110745Z] Loop 1740: Reg: 0.3545, AltReg: 0.5908, CorReg: 0.0001, TopReg: 0.3931, AllReg: 0.5908, BotRReg: 0.7599, OV: 0.4493, AltV: 0.2388, CorV: 0.7651, TopV: 0.4036, BotRV: 0.0368, AllV: 0.2388 +[2026-01-29T22:00:10.953766Z] Loop 1745: Reg: 0.3541, AltReg: 0.5900, CorReg: 0.0002, TopReg: 0.3825, AllReg: 0.5900, BotRReg: 0.7613, OV: 0.4497, AltV: 0.2395, CorV: 0.7649, TopV: 0.4142, BotRV: 0.0354, AllV: 0.2395 +[2026-01-29T22:00:16.799712Z] Loop 1750: Reg: 0.3644, AltReg: 0.6007, CorReg: 0.0100, TopReg: 0.3707, AllReg: 0.6007, BotRReg: 0.7655, OV: 0.4393, AltV: 0.2288, CorV: 0.7551, TopV: 0.4260, BotRV: 0.0312, AllV: 0.2288 +[2026-01-29T22:00:22.645164Z] Loop 1755: Reg: 0.3544, AltReg: 0.5904, CorReg: 0.0003, TopReg: 0.3776, AllReg: 0.5904, BotRReg: 0.7619, OV: 0.4494, AltV: 0.2391, CorV: 0.7648, TopV: 0.4191, BotRV: 0.0348, AllV: 0.2391 +[2026-01-29T22:00:28.496766Z] Loop 1760: Reg: 0.3557, AltReg: 0.5928, CorReg: 0.0001, TopReg: 0.4041, AllReg: 0.5928, BotRReg: 0.7591, OV: 0.4481, AltV: 0.2368, CorV: 0.7651, TopV: 0.3926, BotRV: 0.0376, AllV: 0.2368 +[2026-01-29T22:00:34.347347Z] Loop 1765: Reg: 0.3571, AltReg: 0.5951, CorReg: 0.0001, TopReg: 0.4168, AllReg: 0.5951, BotRReg: 0.7589, OV: 0.4467, AltV: 0.2344, CorV: 0.7650, TopV: 0.3799, BotRV: 0.0378, AllV: 0.2344 +[2026-01-29T22:00:40.197916Z] Loop 1770: Reg: 0.3538, AltReg: 0.5897, CorReg: 0.0000, TopReg: 0.3865, AllReg: 0.5897, BotRReg: 0.7605, OV: 0.4500, AltV: 0.2399, CorV: 0.7651, TopV: 0.4102, BotRV: 0.0362, AllV: 0.2399 +[2026-01-29T22:00:46.048343Z] Loop 1775: Reg: 0.3557, AltReg: 0.5926, CorReg: 0.0003, TopReg: 0.3724, AllReg: 0.5926, BotRReg: 0.7628, OV: 0.4481, AltV: 0.2370, CorV: 0.7648, TopV: 0.4243, BotRV: 0.0339, AllV: 0.2370 +[2026-01-29T22:00:51.895591Z] Loop 1780: Reg: 0.3544, AltReg: 0.5907, CorReg: 0.0000, TopReg: 0.3926, AllReg: 0.5907, BotRReg: 0.7595, OV: 0.4494, AltV: 0.2389, CorV: 0.7651, TopV: 0.4041, BotRV: 0.0372, AllV: 0.2389 +[2026-01-29T22:00:57.740314Z] Loop 1785: Reg: 0.3578, AltReg: 0.5963, CorReg: 0.0000, TopReg: 0.4225, AllReg: 0.5963, BotRReg: 0.7587, OV: 0.4460, AltV: 0.2332, CorV: 0.7651, TopV: 0.3742, BotRV: 0.0380, AllV: 0.2332 +[2026-01-29T22:01:03.585771Z] Loop 1790: Reg: 0.3570, AltReg: 0.5951, CorReg: 0.0000, TopReg: 0.4159, AllReg: 0.5951, BotRReg: 0.7588, OV: 0.4467, AltV: 0.2345, CorV: 0.7651, TopV: 0.3808, BotRV: 0.0379, AllV: 0.2345 +[2026-01-29T22:01:09.430958Z] Loop 1795: Reg: 0.3548, AltReg: 0.5913, CorReg: 0.0000, TopReg: 0.3966, AllReg: 0.5913, BotRReg: 0.7591, OV: 0.4490, AltV: 0.2382, CorV: 0.7651, TopV: 0.4000, BotRV: 0.0376, AllV: 0.2382 +[2026-01-29T22:01:15.282568Z] Loop 1800: Reg: 0.3548, AltReg: 0.5913, CorReg: 0.0000, TopReg: 0.3987, AllReg: 0.5913, BotRReg: 0.7591, OV: 0.4490, AltV: 0.2382, CorV: 0.7651, TopV: 0.3980, BotRV: 0.0376, AllV: 0.2382 +[2026-01-29T22:01:21.133724Z] Loop 1805: Reg: 0.3537, AltReg: 0.5894, CorReg: 0.0000, TopReg: 0.3894, AllReg: 0.5894, BotRReg: 0.7596, OV: 0.4501, AltV: 0.2402, CorV: 0.7651, TopV: 0.4073, BotRV: 0.0371, AllV: 0.2402 +[2026-01-29T22:01:26.974438Z] Loop 1810: Reg: 0.3552, AltReg: 0.5917, CorReg: 0.0004, TopReg: 0.3698, AllReg: 0.5917, BotRReg: 0.7626, OV: 0.4486, AltV: 0.2379, CorV: 0.7647, TopV: 0.4269, BotRV: 0.0341, AllV: 0.2379 +[2026-01-29T22:01:32.823220Z] Loop 1815: Reg: 0.3534, AltReg: 0.5890, CorReg: 0.0001, TopReg: 0.3741, AllReg: 0.5890, BotRReg: 0.7616, OV: 0.4504, AltV: 0.2406, CorV: 0.7651, TopV: 0.4226, BotRV: 0.0351, AllV: 0.2406 +[2026-01-29T22:01:38.670701Z] Loop 1820: Reg: 0.3535, AltReg: 0.5892, CorReg: 0.0000, TopReg: 0.3836, AllReg: 0.5892, BotRReg: 0.7605, OV: 0.4503, AltV: 0.2404, CorV: 0.7651, TopV: 0.4131, BotRV: 0.0362, AllV: 0.2404 +[2026-01-29T22:01:44.519698Z] Loop 1825: Reg: 0.3541, AltReg: 0.5901, CorReg: 0.0000, TopReg: 0.3904, AllReg: 0.5901, BotRReg: 0.7593, OV: 0.4497, AltV: 0.2394, CorV: 0.7651, TopV: 0.4063, BotRV: 0.0374, AllV: 0.2394 +[2026-01-29T22:01:50.360688Z] Loop 1830: Reg: 0.3536, AltReg: 0.5893, CorReg: 0.0000, TopReg: 0.3843, AllReg: 0.5893, BotRReg: 0.7604, OV: 0.4502, AltV: 0.2403, CorV: 0.7651, TopV: 0.4124, BotRV: 0.0363, AllV: 0.2403 +[2026-01-29T22:01:56.208078Z] Loop 1835: Reg: 0.3533, AltReg: 0.5889, CorReg: 0.0000, TopReg: 0.3794, AllReg: 0.5889, BotRReg: 0.7610, OV: 0.4504, AltV: 0.2407, CorV: 0.7651, TopV: 0.4173, BotRV: 0.0357, AllV: 0.2407 +[2026-01-29T22:02:02.061498Z] Loop 1840: Reg: 0.3533, AltReg: 0.5889, CorReg: 0.0000, TopReg: 0.3838, AllReg: 0.5889, BotRReg: 0.7602, OV: 0.4504, AltV: 0.2407, CorV: 0.7651, TopV: 0.4129, BotRV: 0.0365, AllV: 0.2407 +[2026-01-29T22:02:07.906222Z] Loop 1845: Reg: 0.3542, AltReg: 0.5903, CorReg: 0.0000, TopReg: 0.3931, AllReg: 0.5903, BotRReg: 0.7591, OV: 0.4496, AltV: 0.2392, CorV: 0.7651, TopV: 0.4036, BotRV: 0.0376, AllV: 0.2392 +[2026-01-29T22:02:13.748729Z] Loop 1850: Reg: 0.3543, AltReg: 0.5905, CorReg: 0.0000, TopReg: 0.3950, AllReg: 0.5905, BotRReg: 0.7591, OV: 0.4495, AltV: 0.2390, CorV: 0.7651, TopV: 0.4016, BotRV: 0.0376, AllV: 0.2390 +[2026-01-29T22:02:19.591986Z] Loop 1855: Reg: 0.3530, AltReg: 0.5883, CorReg: 0.0000, TopReg: 0.3799, AllReg: 0.5883, BotRReg: 0.7605, OV: 0.4508, AltV: 0.2413, CorV: 0.7651, TopV: 0.4168, BotRV: 0.0362, AllV: 0.2413 +[2026-01-29T22:02:25.441525Z] Loop 1860: Reg: 0.3537, AltReg: 0.5895, CorReg: 0.0001, TopReg: 0.3695, AllReg: 0.5895, BotRReg: 0.7628, OV: 0.4501, AltV: 0.2401, CorV: 0.7650, TopV: 0.4272, BotRV: 0.0338, AllV: 0.2401 +[2026-01-29T22:02:31.286326Z] Loop 1865: Reg: 0.3526, AltReg: 0.5876, CorReg: 0.0001, TopReg: 0.3710, AllReg: 0.5876, BotRReg: 0.7615, OV: 0.4512, AltV: 0.2419, CorV: 0.7651, TopV: 0.4257, BotRV: 0.0352, AllV: 0.2419 +[2026-01-29T22:02:37.138619Z] Loop 1870: Reg: 0.3526, AltReg: 0.5877, CorReg: 0.0000, TopReg: 0.3796, AllReg: 0.5877, BotRReg: 0.7599, OV: 0.4512, AltV: 0.2419, CorV: 0.7651, TopV: 0.4171, BotRV: 0.0368, AllV: 0.2419 +[2026-01-29T22:02:42.982325Z] Loop 1875: Reg: 0.3524, AltReg: 0.5872, CorReg: 0.0000, TopReg: 0.3770, AllReg: 0.5872, BotRReg: 0.7600, OV: 0.4514, AltV: 0.2423, CorV: 0.7651, TopV: 0.4197, BotRV: 0.0367, AllV: 0.2423 +[2026-01-29T22:02:48.824541Z] Loop 1880: Reg: 0.3522, AltReg: 0.5869, CorReg: 0.0001, TopReg: 0.3709, AllReg: 0.5869, BotRReg: 0.7610, OV: 0.4516, AltV: 0.2426, CorV: 0.7650, TopV: 0.4258, BotRV: 0.0357, AllV: 0.2426 +[2026-01-29T22:02:54.668743Z] Loop 1885: Reg: 0.3535, AltReg: 0.5889, CorReg: 0.0003, TopReg: 0.3688, AllReg: 0.5889, BotRReg: 0.7621, OV: 0.4503, AltV: 0.2406, CorV: 0.7648, TopV: 0.4279, BotRV: 0.0346, AllV: 0.2406 +[2026-01-29T22:03:00.516367Z] Loop 1890: Reg: 0.3530, AltReg: 0.5882, CorReg: 0.0002, TopReg: 0.3691, AllReg: 0.5882, BotRReg: 0.7618, OV: 0.4508, AltV: 0.2414, CorV: 0.7649, TopV: 0.4276, BotRV: 0.0349, AllV: 0.2414 +[2026-01-29T22:03:06.365967Z] Loop 1895: Reg: 0.3525, AltReg: 0.5874, CorReg: 0.0001, TopReg: 0.3694, AllReg: 0.5874, BotRReg: 0.7615, OV: 0.4513, AltV: 0.2422, CorV: 0.7650, TopV: 0.4273, BotRV: 0.0352, AllV: 0.2422 +[2026-01-29T22:03:12.226465Z] Loop 1900: Reg: 0.3520, AltReg: 0.5866, CorReg: 0.0000, TopReg: 0.3714, AllReg: 0.5866, BotRReg: 0.7606, OV: 0.4518, AltV: 0.2430, CorV: 0.7651, TopV: 0.4253, BotRV: 0.0361, AllV: 0.2430 +[2026-01-29T22:03:18.073487Z] Loop 1905: Reg: 0.3526, AltReg: 0.5876, CorReg: 0.0000, TopReg: 0.3817, AllReg: 0.5876, BotRReg: 0.7594, OV: 0.4512, AltV: 0.2419, CorV: 0.7651, TopV: 0.4149, BotRV: 0.0372, AllV: 0.2419 +[2026-01-29T22:03:23.918300Z] Loop 1910: Reg: 0.3531, AltReg: 0.5885, CorReg: 0.0001, TopReg: 0.3882, AllReg: 0.5885, BotRReg: 0.7592, OV: 0.4506, AltV: 0.2411, CorV: 0.7650, TopV: 0.4085, BotRV: 0.0375, AllV: 0.2411 +[2026-01-29T22:03:29.765615Z] Loop 1915: Reg: 0.3523, AltReg: 0.5872, CorReg: 0.0001, TopReg: 0.3790, AllReg: 0.5872, BotRReg: 0.7598, OV: 0.4514, AltV: 0.2424, CorV: 0.7650, TopV: 0.4177, BotRV: 0.0369, AllV: 0.2424 +[2026-01-29T22:03:35.617192Z] Loop 1920: Reg: 0.3556, AltReg: 0.5917, CorReg: 0.0014, TopReg: 0.3664, AllReg: 0.5917, BotRReg: 0.7629, OV: 0.4482, AltV: 0.2378, CorV: 0.7637, TopV: 0.4303, BotRV: 0.0338, AllV: 0.2378 +[2026-01-29T22:03:41.464987Z] Loop 1925: Reg: 0.3552, AltReg: 0.5914, CorReg: 0.0009, TopReg: 0.3664, AllReg: 0.5914, BotRReg: 0.7630, OV: 0.4486, AltV: 0.2381, CorV: 0.7642, TopV: 0.4303, BotRV: 0.0337, AllV: 0.2381 +[2026-01-29T22:03:47.312276Z] Loop 1930: Reg: 0.3521, AltReg: 0.5869, CorReg: 0.0000, TopReg: 0.3698, AllReg: 0.5869, BotRReg: 0.7612, OV: 0.4516, AltV: 0.2427, CorV: 0.7651, TopV: 0.4269, BotRV: 0.0355, AllV: 0.2427 +[2026-01-29T22:03:53.160279Z] Loop 1935: Reg: 0.3526, AltReg: 0.5876, CorReg: 0.0000, TopReg: 0.3698, AllReg: 0.5876, BotRReg: 0.7619, OV: 0.4512, AltV: 0.2419, CorV: 0.7651, TopV: 0.4269, BotRV: 0.0348, AllV: 0.2419 +[2026-01-29T22:03:59.005537Z] Loop 1940: Reg: 0.3525, AltReg: 0.5875, CorReg: 0.0000, TopReg: 0.3717, AllReg: 0.5875, BotRReg: 0.7612, OV: 0.4513, AltV: 0.2421, CorV: 0.7651, TopV: 0.4250, BotRV: 0.0355, AllV: 0.2421 +[2026-01-29T22:04:04.851931Z] Loop 1945: Reg: 0.3534, AltReg: 0.5891, CorReg: 0.0000, TopReg: 0.3892, AllReg: 0.5891, BotRReg: 0.7590, OV: 0.4503, AltV: 0.2405, CorV: 0.7651, TopV: 0.4075, BotRV: 0.0377, AllV: 0.2405 +[2026-01-29T22:04:10.698997Z] Loop 1950: Reg: 0.3541, AltReg: 0.5902, CorReg: 0.0000, TopReg: 0.3968, AllReg: 0.5902, BotRReg: 0.7588, OV: 0.4497, AltV: 0.2394, CorV: 0.7651, TopV: 0.3999, BotRV: 0.0379, AllV: 0.2394 +[2026-01-29T22:04:16.550435Z] Loop 1955: Reg: 0.3537, AltReg: 0.5895, CorReg: 0.0000, TopReg: 0.3946, AllReg: 0.5895, BotRReg: 0.7588, OV: 0.4501, AltV: 0.2400, CorV: 0.7651, TopV: 0.4021, BotRV: 0.0379, AllV: 0.2400 +[2026-01-29T22:04:22.399791Z] Loop 1960: Reg: 0.3540, AltReg: 0.5899, CorReg: 0.0000, TopReg: 0.3989, AllReg: 0.5899, BotRReg: 0.7588, OV: 0.4498, AltV: 0.2396, CorV: 0.7651, TopV: 0.3978, BotRV: 0.0379, AllV: 0.2396 +[2026-01-29T22:04:28.246061Z] Loop 1965: Reg: 0.3527, AltReg: 0.5878, CorReg: 0.0000, TopReg: 0.3845, AllReg: 0.5878, BotRReg: 0.7592, OV: 0.4511, AltV: 0.2418, CorV: 0.7651, TopV: 0.4122, BotRV: 0.0375, AllV: 0.2418 +[2026-01-29T22:04:34.096966Z] Loop 1970: Reg: 0.3518, AltReg: 0.5863, CorReg: 0.0000, TopReg: 0.3742, AllReg: 0.5863, BotRReg: 0.7600, OV: 0.4520, AltV: 0.2433, CorV: 0.7651, TopV: 0.4225, BotRV: 0.0367, AllV: 0.2433 +[2026-01-29T22:04:39.950666Z] Loop 1975: Reg: 0.3531, AltReg: 0.5882, CorReg: 0.0003, TopReg: 0.3676, AllReg: 0.5882, BotRReg: 0.7618, OV: 0.4507, AltV: 0.2413, CorV: 0.7649, TopV: 0.4291, BotRV: 0.0349, AllV: 0.2413 +[2026-01-29T22:04:45.802550Z] Loop 1980: Reg: 0.3521, AltReg: 0.5868, CorReg: 0.0001, TopReg: 0.3691, AllReg: 0.5868, BotRReg: 0.7613, OV: 0.4517, AltV: 0.2428, CorV: 0.7650, TopV: 0.4276, BotRV: 0.0354, AllV: 0.2428 +[2026-01-29T22:04:51.657455Z] Loop 1985: Reg: 0.3517, AltReg: 0.5861, CorReg: 0.0000, TopReg: 0.3706, AllReg: 0.5861, BotRReg: 0.7607, OV: 0.4521, AltV: 0.2435, CorV: 0.7651, TopV: 0.4261, BotRV: 0.0359, AllV: 0.2435 +[2026-01-29T22:04:57.505878Z] Loop 1990: Reg: 0.3516, AltReg: 0.5859, CorReg: 0.0000, TopReg: 0.3715, AllReg: 0.5859, BotRReg: 0.7604, OV: 0.4522, AltV: 0.2436, CorV: 0.7651, TopV: 0.4252, BotRV: 0.0363, AllV: 0.2436 +[2026-01-29T22:05:03.353458Z] Loop 1995: Reg: 0.3520, AltReg: 0.5866, CorReg: 0.0000, TopReg: 0.3774, AllReg: 0.5866, BotRReg: 0.7596, OV: 0.4518, AltV: 0.2429, CorV: 0.7651, TopV: 0.4193, BotRV: 0.0371, AllV: 0.2429 +[2026-01-29T22:05:09.200658Z] Loop 2000: Reg: 0.3529, AltReg: 0.5881, CorReg: 0.0000, TopReg: 0.3886, AllReg: 0.5881, BotRReg: 0.7591, OV: 0.4509, AltV: 0.2415, CorV: 0.7651, TopV: 0.4081, BotRV: 0.0376, AllV: 0.2415 +[2026-01-29T22:05:20.848473Z] Loop 2010: Reg: 0.3515, AltReg: 0.5858, CorReg: 0.0000, TopReg: 0.3716, AllReg: 0.5858, BotRReg: 0.7603, OV: 0.4523, AltV: 0.2437, CorV: 0.7651, TopV: 0.4250, BotRV: 0.0364, AllV: 0.2437 +[2026-01-29T22:05:32.509390Z] Loop 2020: Reg: 0.3515, AltReg: 0.5858, CorReg: 0.0000, TopReg: 0.3714, AllReg: 0.5858, BotRReg: 0.7604, OV: 0.4523, AltV: 0.2438, CorV: 0.7651, TopV: 0.4253, BotRV: 0.0363, AllV: 0.2438 +[2026-01-29T22:05:44.168131Z] Loop 2030: Reg: 0.3515, AltReg: 0.5857, CorReg: 0.0000, TopReg: 0.3710, AllReg: 0.5857, BotRReg: 0.7606, OV: 0.4523, AltV: 0.2438, CorV: 0.7651, TopV: 0.4257, BotRV: 0.0361, AllV: 0.2438 +[2026-01-29T22:05:55.818450Z] Loop 2040: Reg: 0.3533, AltReg: 0.5889, CorReg: 0.0001, TopReg: 0.3675, AllReg: 0.5889, BotRReg: 0.7634, OV: 0.4504, AltV: 0.2407, CorV: 0.7650, TopV: 0.4292, BotRV: 0.0333, AllV: 0.2407 +[2026-01-29T22:06:07.491284Z] Loop 2050: Reg: 0.3520, AltReg: 0.5866, CorReg: 0.0000, TopReg: 0.3728, AllReg: 0.5866, BotRReg: 0.7610, OV: 0.4518, AltV: 0.2429, CorV: 0.7651, TopV: 0.4239, BotRV: 0.0357, AllV: 0.2429 +[2026-01-29T22:06:19.168100Z] Loop 2060: Reg: 0.3537, AltReg: 0.5896, CorReg: 0.0000, TopReg: 0.3931, AllReg: 0.5896, BotRReg: 0.7588, OV: 0.4500, AltV: 0.2400, CorV: 0.7651, TopV: 0.4036, BotRV: 0.0379, AllV: 0.2400 +[2026-01-29T22:06:30.843897Z] Loop 2070: Reg: 0.3520, AltReg: 0.5866, CorReg: 0.0000, TopReg: 0.3760, AllReg: 0.5866, BotRReg: 0.7600, OV: 0.4518, AltV: 0.2430, CorV: 0.7651, TopV: 0.4207, BotRV: 0.0367, AllV: 0.2430 +[2026-01-29T22:06:42.503092Z] Loop 2080: Reg: 0.3528, AltReg: 0.5879, CorReg: 0.0001, TopReg: 0.3671, AllReg: 0.5879, BotRReg: 0.7625, OV: 0.4510, AltV: 0.2416, CorV: 0.7650, TopV: 0.4296, BotRV: 0.0342, AllV: 0.2416 +[2026-01-29T22:06:54.177024Z] Loop 2090: Reg: 0.3514, AltReg: 0.5857, CorReg: 0.0000, TopReg: 0.3693, AllReg: 0.5857, BotRReg: 0.7611, OV: 0.4523, AltV: 0.2438, CorV: 0.7651, TopV: 0.4274, BotRV: 0.0356, AllV: 0.2438 +[2026-01-29T22:07:05.842481Z] Loop 2100: Reg: 0.3544, AltReg: 0.5906, CorReg: 0.0001, TopReg: 0.3991, AllReg: 0.5906, BotRReg: 0.7587, OV: 0.4494, AltV: 0.2389, CorV: 0.7650, TopV: 0.3976, BotRV: 0.0380, AllV: 0.2389 +[2026-01-29T22:07:17.504420Z] Loop 2110: Reg: 0.3527, AltReg: 0.5879, CorReg: 0.0000, TopReg: 0.3857, AllReg: 0.5879, BotRReg: 0.7591, OV: 0.4510, AltV: 0.2417, CorV: 0.7651, TopV: 0.4109, BotRV: 0.0376, AllV: 0.2417 +[2026-01-29T22:07:29.169488Z] Loop 2120: Reg: 0.3562, AltReg: 0.5937, CorReg: 0.0000, TopReg: 0.3677, AllReg: 0.5937, BotRReg: 0.7650, OV: 0.4476, AltV: 0.2359, CorV: 0.7651, TopV: 0.4290, BotRV: 0.0316, AllV: 0.2359 +[2026-01-29T22:07:40.832731Z] Loop 2130: Reg: 0.3516, AltReg: 0.5861, CorReg: 0.0000, TopReg: 0.3717, AllReg: 0.5861, BotRReg: 0.7606, OV: 0.4521, AltV: 0.2435, CorV: 0.7651, TopV: 0.4250, BotRV: 0.0361, AllV: 0.2435 +[2026-01-29T22:07:52.490209Z] Loop 2140: Reg: 0.3515, AltReg: 0.5857, CorReg: 0.0000, TopReg: 0.3687, AllReg: 0.5857, BotRReg: 0.7617, OV: 0.4523, AltV: 0.2438, CorV: 0.7651, TopV: 0.4279, BotRV: 0.0350, AllV: 0.2438 +[2026-01-29T22:08:04.162977Z] Loop 2150: Reg: 0.3514, AltReg: 0.5857, CorReg: 0.0000, TopReg: 0.3703, AllReg: 0.5857, BotRReg: 0.7606, OV: 0.4523, AltV: 0.2438, CorV: 0.7651, TopV: 0.4264, BotRV: 0.0361, AllV: 0.2438 +[2026-01-29T22:08:15.809744Z] Loop 2160: Reg: 0.3515, AltReg: 0.5858, CorReg: 0.0000, TopReg: 0.3702, AllReg: 0.5858, BotRReg: 0.7609, OV: 0.4523, AltV: 0.2437, CorV: 0.7651, TopV: 0.4265, BotRV: 0.0357, AllV: 0.2437 +[2026-01-29T22:08:27.458698Z] Loop 2170: Reg: 0.3518, AltReg: 0.5863, CorReg: 0.0000, TopReg: 0.3686, AllReg: 0.5863, BotRReg: 0.7621, OV: 0.4520, AltV: 0.2433, CorV: 0.7651, TopV: 0.4281, BotRV: 0.0346, AllV: 0.2433 +[2026-01-29T22:08:39.143274Z] Loop 2180: Reg: 0.3523, AltReg: 0.5871, CorReg: 0.0000, TopReg: 0.3683, AllReg: 0.5871, BotRReg: 0.7623, OV: 0.4515, AltV: 0.2424, CorV: 0.7651, TopV: 0.4284, BotRV: 0.0343, AllV: 0.2424 +[2026-01-29T22:08:50.831533Z] Loop 2190: Reg: 0.3514, AltReg: 0.5857, CorReg: 0.0000, TopReg: 0.3705, AllReg: 0.5857, BotRReg: 0.7602, OV: 0.4524, AltV: 0.2439, CorV: 0.7651, TopV: 0.4262, BotRV: 0.0365, AllV: 0.2439 +[2026-01-29T22:09:02.497014Z] Loop 2200: Reg: 0.3536, AltReg: 0.5888, CorReg: 0.0008, TopReg: 0.3904, AllReg: 0.5888, BotRReg: 0.7590, OV: 0.4502, AltV: 0.2407, CorV: 0.7644, TopV: 0.4063, BotRV: 0.0377, AllV: 0.2407 +[2026-01-29T22:09:14.165581Z] Loop 2210: Reg: 0.3517, AltReg: 0.5861, CorReg: 0.0001, TopReg: 0.3754, AllReg: 0.5861, BotRReg: 0.7597, OV: 0.4521, AltV: 0.2434, CorV: 0.7650, TopV: 0.4213, BotRV: 0.0369, AllV: 0.2434 +[2026-01-29T22:09:25.829475Z] Loop 2220: Reg: 0.3527, AltReg: 0.5878, CorReg: 0.0001, TopReg: 0.3643, AllReg: 0.5878, BotRReg: 0.7627, OV: 0.4511, AltV: 0.2418, CorV: 0.7651, TopV: 0.4324, BotRV: 0.0340, AllV: 0.2418 +[2026-01-29T22:09:37.491939Z] Loop 2230: Reg: 0.3516, AltReg: 0.5859, CorReg: 0.0000, TopReg: 0.3665, AllReg: 0.5859, BotRReg: 0.7620, OV: 0.4522, AltV: 0.2436, CorV: 0.7651, TopV: 0.4302, BotRV: 0.0347, AllV: 0.2436 +[2026-01-29T22:09:49.160322Z] Loop 2240: Reg: 0.3513, AltReg: 0.5854, CorReg: 0.0000, TopReg: 0.3702, AllReg: 0.5854, BotRReg: 0.7603, OV: 0.4525, AltV: 0.2441, CorV: 0.7651, TopV: 0.4265, BotRV: 0.0363, AllV: 0.2441 +[2026-01-29T22:10:00.828356Z] Loop 2250: Reg: 0.3518, AltReg: 0.5863, CorReg: 0.0000, TopReg: 0.3672, AllReg: 0.5863, BotRReg: 0.7624, OV: 0.4520, AltV: 0.2433, CorV: 0.7651, TopV: 0.4294, BotRV: 0.0343, AllV: 0.2433 +[2026-01-29T22:10:12.472397Z] Loop 2260: Reg: 0.3512, AltReg: 0.5854, CorReg: 0.0000, TopReg: 0.3691, AllReg: 0.5854, BotRReg: 0.7612, OV: 0.4525, AltV: 0.2442, CorV: 0.7651, TopV: 0.4276, BotRV: 0.0354, AllV: 0.2442 +[2026-01-29T22:10:24.119544Z] Loop 2270: Reg: 0.3533, AltReg: 0.5889, CorReg: 0.0001, TopReg: 0.3929, AllReg: 0.5889, BotRReg: 0.7589, OV: 0.4504, AltV: 0.2407, CorV: 0.7651, TopV: 0.4038, BotRV: 0.0378, AllV: 0.2407 +[2026-01-29T22:10:35.786359Z] Loop 2280: Reg: 0.3518, AltReg: 0.5862, CorReg: 0.0000, TopReg: 0.3759, AllReg: 0.5862, BotRReg: 0.7597, OV: 0.4520, AltV: 0.2433, CorV: 0.7651, TopV: 0.4208, BotRV: 0.0370, AllV: 0.2433 +[2026-01-29T22:10:47.452030Z] Loop 2290: Reg: 0.3511, AltReg: 0.5852, CorReg: 0.0000, TopReg: 0.3682, AllReg: 0.5852, BotRReg: 0.7611, OV: 0.4527, AltV: 0.2444, CorV: 0.7651, TopV: 0.4285, BotRV: 0.0356, AllV: 0.2444 +[2026-01-29T22:10:59.103754Z] Loop 2300: Reg: 0.3546, AltReg: 0.5909, CorReg: 0.0002, TopReg: 0.3626, AllReg: 0.5909, BotRReg: 0.7642, OV: 0.4492, AltV: 0.2387, CorV: 0.7649, TopV: 0.4341, BotRV: 0.0325, AllV: 0.2387 +[2026-01-29T22:11:10.781792Z] Loop 2310: Reg: 0.3525, AltReg: 0.5874, CorReg: 0.0000, TopReg: 0.3675, AllReg: 0.5874, BotRReg: 0.7628, OV: 0.4513, AltV: 0.2421, CorV: 0.7651, TopV: 0.4292, BotRV: 0.0339, AllV: 0.2421 +[2026-01-29T22:11:22.457330Z] Loop 2320: Reg: 0.3521, AltReg: 0.5869, CorReg: 0.0000, TopReg: 0.3764, AllReg: 0.5869, BotRReg: 0.7612, OV: 0.4517, AltV: 0.2427, CorV: 0.7651, TopV: 0.4203, BotRV: 0.0355, AllV: 0.2427 +[2026-01-29T22:11:34.127766Z] Loop 2330: Reg: 0.3527, AltReg: 0.5878, CorReg: 0.0000, TopReg: 0.3849, AllReg: 0.5878, BotRReg: 0.7595, OV: 0.4511, AltV: 0.2417, CorV: 0.7651, TopV: 0.4118, BotRV: 0.0372, AllV: 0.2417 +[2026-01-29T22:11:45.779099Z] Loop 2340: Reg: 0.3523, AltReg: 0.5872, CorReg: 0.0000, TopReg: 0.3810, AllReg: 0.5872, BotRReg: 0.7592, OV: 0.4515, AltV: 0.2424, CorV: 0.7651, TopV: 0.4157, BotRV: 0.0375, AllV: 0.2424 +[2026-01-29T22:11:57.435581Z] Loop 2350: Reg: 0.3513, AltReg: 0.5854, CorReg: 0.0000, TopReg: 0.3682, AllReg: 0.5854, BotRReg: 0.7619, OV: 0.4525, AltV: 0.2441, CorV: 0.7651, TopV: 0.4285, BotRV: 0.0348, AllV: 0.2441 +[2026-01-29T22:12:09.099004Z] Loop 2360: Reg: 0.3521, AltReg: 0.5868, CorReg: 0.0000, TopReg: 0.3634, AllReg: 0.5868, BotRReg: 0.7629, OV: 0.4517, AltV: 0.2427, CorV: 0.7651, TopV: 0.4333, BotRV: 0.0338, AllV: 0.2427 +[2026-01-29T22:12:20.755506Z] Loop 2370: Reg: 0.3512, AltReg: 0.5852, CorReg: 0.0000, TopReg: 0.3702, AllReg: 0.5852, BotRReg: 0.7600, OV: 0.4526, AltV: 0.2443, CorV: 0.7651, TopV: 0.4265, BotRV: 0.0367, AllV: 0.2443 +[2026-01-29T22:12:32.419879Z] Loop 2380: Reg: 0.3552, AltReg: 0.5905, CorReg: 0.0022, TopReg: 0.4174, AllReg: 0.5905, BotRReg: 0.7591, OV: 0.4486, AltV: 0.2391, CorV: 0.7630, TopV: 0.3793, BotRV: 0.0376, AllV: 0.2391 +[2026-01-29T22:12:44.061443Z] Loop 2390: Reg: 0.3511, AltReg: 0.5852, CorReg: 0.0000, TopReg: 0.3669, AllReg: 0.5852, BotRReg: 0.7608, OV: 0.4526, AltV: 0.2444, CorV: 0.7651, TopV: 0.4298, BotRV: 0.0359, AllV: 0.2444 +[2026-01-29T22:12:55.705025Z] Loop 2400: Reg: 0.3521, AltReg: 0.5868, CorReg: 0.0001, TopReg: 0.3641, AllReg: 0.5868, BotRReg: 0.7626, OV: 0.4517, AltV: 0.2428, CorV: 0.7651, TopV: 0.4326, BotRV: 0.0341, AllV: 0.2428 +[2026-01-29T22:13:07.362431Z] Loop 2410: Reg: 0.3520, AltReg: 0.5866, CorReg: 0.0000, TopReg: 0.3821, AllReg: 0.5866, BotRReg: 0.7597, OV: 0.4518, AltV: 0.2429, CorV: 0.7651, TopV: 0.4146, BotRV: 0.0370, AllV: 0.2429 +[2026-01-29T22:13:19.018845Z] Loop 2420: Reg: 0.3546, AltReg: 0.5909, CorReg: 0.0001, TopReg: 0.4264, AllReg: 0.5909, BotRReg: 0.7593, OV: 0.4492, AltV: 0.2387, CorV: 0.7650, TopV: 0.3703, BotRV: 0.0374, AllV: 0.2387 +[2026-01-29T22:13:30.677365Z] Loop 2430: Reg: 0.3525, AltReg: 0.5874, CorReg: 0.0001, TopReg: 0.3934, AllReg: 0.5874, BotRReg: 0.7599, OV: 0.4513, AltV: 0.2421, CorV: 0.7650, TopV: 0.4033, BotRV: 0.0367, AllV: 0.2421 +[2026-01-29T22:13:42.329378Z] Loop 2440: Reg: 0.3517, AltReg: 0.5861, CorReg: 0.0001, TopReg: 0.3777, AllReg: 0.5861, BotRReg: 0.7607, OV: 0.4521, AltV: 0.2434, CorV: 0.7650, TopV: 0.4189, BotRV: 0.0359, AllV: 0.2434 +[2026-01-29T22:13:53.977665Z] Loop 2450: Reg: 0.3523, AltReg: 0.5871, CorReg: 0.0002, TopReg: 0.3834, AllReg: 0.5871, BotRReg: 0.7610, OV: 0.4514, AltV: 0.2425, CorV: 0.7649, TopV: 0.4133, BotRV: 0.0356, AllV: 0.2425 +[2026-01-29T22:14:05.629029Z] Loop 2460: Reg: 0.3537, AltReg: 0.5892, CorReg: 0.0005, TopReg: 0.3930, AllReg: 0.5892, BotRReg: 0.7615, OV: 0.4500, AltV: 0.2404, CorV: 0.7646, TopV: 0.4037, BotRV: 0.0352, AllV: 0.2404 +[2026-01-29T22:14:17.290743Z] Loop 2470: Reg: 0.3515, AltReg: 0.5858, CorReg: 0.0001, TopReg: 0.3757, AllReg: 0.5858, BotRReg: 0.7606, OV: 0.4522, AltV: 0.2437, CorV: 0.7650, TopV: 0.4210, BotRV: 0.0361, AllV: 0.2437 +[2026-01-29T22:14:28.943221Z] Loop 2480: Reg: 0.3510, AltReg: 0.5850, CorReg: 0.0000, TopReg: 0.3639, AllReg: 0.5850, BotRReg: 0.7614, OV: 0.4528, AltV: 0.2446, CorV: 0.7651, TopV: 0.4328, BotRV: 0.0353, AllV: 0.2446 +[2026-01-29T22:14:40.598189Z] Loop 2490: Reg: 0.3512, AltReg: 0.5853, CorReg: 0.0000, TopReg: 0.3645, AllReg: 0.5853, BotRReg: 0.7619, OV: 0.4526, AltV: 0.2442, CorV: 0.7651, TopV: 0.4322, BotRV: 0.0348, AllV: 0.2442 +[2026-01-29T22:14:52.250656Z] Loop 2500: Reg: 0.3520, AltReg: 0.5866, CorReg: 0.0000, TopReg: 0.3646, AllReg: 0.5866, BotRReg: 0.7630, OV: 0.4518, AltV: 0.2430, CorV: 0.7651, TopV: 0.4321, BotRV: 0.0337, AllV: 0.2430 +[2026-01-29T22:15:03.906672Z] Loop 2510: Reg: 0.3511, AltReg: 0.5851, CorReg: 0.0000, TopReg: 0.3687, AllReg: 0.5851, BotRReg: 0.7610, OV: 0.4527, AltV: 0.2444, CorV: 0.7651, TopV: 0.4279, BotRV: 0.0357, AllV: 0.2444 +[2026-01-29T22:15:15.579145Z] Loop 2520: Reg: 0.3548, AltReg: 0.5912, CorReg: 0.0000, TopReg: 0.4074, AllReg: 0.5912, BotRReg: 0.7586, OV: 0.4490, AltV: 0.2383, CorV: 0.7651, TopV: 0.3893, BotRV: 0.0381, AllV: 0.2383 +[2026-01-29T22:15:27.231057Z] Loop 2530: Reg: 0.3513, AltReg: 0.5855, CorReg: 0.0000, TopReg: 0.3718, AllReg: 0.5855, BotRReg: 0.7596, OV: 0.4525, AltV: 0.2440, CorV: 0.7651, TopV: 0.4249, BotRV: 0.0371, AllV: 0.2440 +[2026-01-29T22:15:38.891534Z] Loop 2540: Reg: 0.3510, AltReg: 0.5850, CorReg: 0.0000, TopReg: 0.3653, AllReg: 0.5850, BotRReg: 0.7617, OV: 0.4528, AltV: 0.2446, CorV: 0.7651, TopV: 0.4314, BotRV: 0.0350, AllV: 0.2446 +[2026-01-29T22:15:50.555278Z] Loop 2550: Reg: 0.3513, AltReg: 0.5854, CorReg: 0.0000, TopReg: 0.3630, AllReg: 0.5854, BotRReg: 0.7625, OV: 0.4525, AltV: 0.2441, CorV: 0.7651, TopV: 0.4337, BotRV: 0.0341, AllV: 0.2441 +[2026-01-29T22:16:02.215619Z] Loop 2560: Reg: 0.3531, AltReg: 0.5884, CorReg: 0.0002, TopReg: 0.3621, AllReg: 0.5884, BotRReg: 0.7636, OV: 0.4506, AltV: 0.2411, CorV: 0.7649, TopV: 0.4346, BotRV: 0.0331, AllV: 0.2411 +[2026-01-29T22:16:13.871472Z] Loop 2570: Reg: 0.3511, AltReg: 0.5851, CorReg: 0.0000, TopReg: 0.3690, AllReg: 0.5851, BotRReg: 0.7603, OV: 0.4527, AltV: 0.2445, CorV: 0.7651, TopV: 0.4276, BotRV: 0.0364, AllV: 0.2445 +[2026-01-29T22:16:25.525963Z] Loop 2580: Reg: 0.3520, AltReg: 0.5867, CorReg: 0.0000, TopReg: 0.3785, AllReg: 0.5867, BotRReg: 0.7589, OV: 0.4517, AltV: 0.2428, CorV: 0.7651, TopV: 0.4182, BotRV: 0.0378, AllV: 0.2428 +[2026-01-29T22:16:37.192981Z] Loop 2590: Reg: 0.3512, AltReg: 0.5853, CorReg: 0.0000, TopReg: 0.3701, AllReg: 0.5853, BotRReg: 0.7598, OV: 0.4526, AltV: 0.2442, CorV: 0.7651, TopV: 0.4266, BotRV: 0.0369, AllV: 0.2442 +[2026-01-29T22:16:48.849202Z] Loop 2600: Reg: 0.3510, AltReg: 0.5850, CorReg: 0.0000, TopReg: 0.3677, AllReg: 0.5850, BotRReg: 0.7613, OV: 0.4528, AltV: 0.2446, CorV: 0.7651, TopV: 0.4290, BotRV: 0.0354, AllV: 0.2446 +[2026-01-29T22:17:00.517946Z] Loop 2610: Reg: 0.3513, AltReg: 0.5854, CorReg: 0.0000, TopReg: 0.3637, AllReg: 0.5854, BotRReg: 0.7624, OV: 0.4525, AltV: 0.2441, CorV: 0.7651, TopV: 0.4330, BotRV: 0.0343, AllV: 0.2441 +[2026-01-29T22:17:12.183565Z] Loop 2620: Reg: 0.3513, AltReg: 0.5854, CorReg: 0.0000, TopReg: 0.3702, AllReg: 0.5854, BotRReg: 0.7599, OV: 0.4525, AltV: 0.2441, CorV: 0.7651, TopV: 0.4265, BotRV: 0.0368, AllV: 0.2441 +[2026-01-29T22:17:23.834919Z] Loop 2630: Reg: 0.3516, AltReg: 0.5860, CorReg: 0.0000, TopReg: 0.3724, AllReg: 0.5860, BotRReg: 0.7598, OV: 0.4522, AltV: 0.2436, CorV: 0.7651, TopV: 0.4243, BotRV: 0.0369, AllV: 0.2436 +[2026-01-29T22:17:35.487854Z] Loop 2640: Reg: 0.3518, AltReg: 0.5863, CorReg: 0.0000, TopReg: 0.3750, AllReg: 0.5863, BotRReg: 0.7591, OV: 0.4520, AltV: 0.2433, CorV: 0.7651, TopV: 0.4217, BotRV: 0.0376, AllV: 0.2433 +[2026-01-29T22:17:47.158010Z] Loop 2650: Reg: 0.3516, AltReg: 0.5860, CorReg: 0.0000, TopReg: 0.3684, AllReg: 0.5860, BotRReg: 0.7624, OV: 0.4522, AltV: 0.2436, CorV: 0.7651, TopV: 0.4283, BotRV: 0.0343, AllV: 0.2436 +[2026-01-29T22:17:58.820097Z] Loop 2660: Reg: 0.3510, AltReg: 0.5851, CorReg: 0.0000, TopReg: 0.3685, AllReg: 0.5851, BotRReg: 0.7614, OV: 0.4527, AltV: 0.2445, CorV: 0.7651, TopV: 0.4282, BotRV: 0.0353, AllV: 0.2445 +[2026-01-29T22:18:10.468082Z] Loop 2670: Reg: 0.3539, AltReg: 0.5898, CorReg: 0.0000, TopReg: 0.3962, AllReg: 0.5898, BotRReg: 0.7586, OV: 0.4499, AltV: 0.2397, CorV: 0.7651, TopV: 0.4005, BotRV: 0.0381, AllV: 0.2397 +[2026-01-29T22:18:22.136736Z] Loop 2680: Reg: 0.3527, AltReg: 0.5879, CorReg: 0.0000, TopReg: 0.3864, AllReg: 0.5879, BotRReg: 0.7586, OV: 0.4511, AltV: 0.2417, CorV: 0.7651, TopV: 0.4103, BotRV: 0.0380, AllV: 0.2417 +[2026-01-29T22:18:33.799033Z] Loop 2690: Reg: 0.3511, AltReg: 0.5851, CorReg: 0.0000, TopReg: 0.3700, AllReg: 0.5851, BotRReg: 0.7598, OV: 0.4527, AltV: 0.2445, CorV: 0.7651, TopV: 0.4266, BotRV: 0.0369, AllV: 0.2445 +[2026-01-29T22:18:45.452200Z] Loop 2700: Reg: 0.3510, AltReg: 0.5850, CorReg: 0.0000, TopReg: 0.3696, AllReg: 0.5850, BotRReg: 0.7599, OV: 0.4527, AltV: 0.2445, CorV: 0.7651, TopV: 0.4271, BotRV: 0.0368, AllV: 0.2445 +[2026-01-29T22:18:57.106622Z] Loop 2710: Reg: 0.3510, AltReg: 0.5850, CorReg: 0.0000, TopReg: 0.3693, AllReg: 0.5850, BotRReg: 0.7599, OV: 0.4528, AltV: 0.2446, CorV: 0.7651, TopV: 0.4274, BotRV: 0.0368, AllV: 0.2446 +[2026-01-29T22:19:08.785950Z] Loop 2720: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3632, AllReg: 0.5845, BotRReg: 0.7610, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4335, BotRV: 0.0357, AllV: 0.2451 +[2026-01-29T22:19:20.452153Z] Loop 2730: Reg: 0.3517, AltReg: 0.5861, CorReg: 0.0000, TopReg: 0.3620, AllReg: 0.5861, BotRReg: 0.7628, OV: 0.4521, AltV: 0.2434, CorV: 0.7651, TopV: 0.4347, BotRV: 0.0339, AllV: 0.2434 +[2026-01-29T22:19:32.110724Z] Loop 2740: Reg: 0.3508, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3642, AllReg: 0.5846, BotRReg: 0.7612, OV: 0.4530, AltV: 0.2450, CorV: 0.7651, TopV: 0.4325, BotRV: 0.0355, AllV: 0.2450 +[2026-01-29T22:19:43.777201Z] Loop 2750: Reg: 0.3509, AltReg: 0.5848, CorReg: 0.0000, TopReg: 0.3671, AllReg: 0.5848, BotRReg: 0.7607, OV: 0.4529, AltV: 0.2448, CorV: 0.7651, TopV: 0.4296, BotRV: 0.0360, AllV: 0.2448 +[2026-01-29T22:19:55.442874Z] Loop 2760: Reg: 0.3509, AltReg: 0.5849, CorReg: 0.0000, TopReg: 0.3682, AllReg: 0.5849, BotRReg: 0.7603, OV: 0.4528, AltV: 0.2447, CorV: 0.7651, TopV: 0.4285, BotRV: 0.0364, AllV: 0.2447 +[2026-01-29T22:20:07.104398Z] Loop 2770: Reg: 0.3510, AltReg: 0.5850, CorReg: 0.0000, TopReg: 0.3692, AllReg: 0.5850, BotRReg: 0.7599, OV: 0.4528, AltV: 0.2445, CorV: 0.7651, TopV: 0.4274, BotRV: 0.0368, AllV: 0.2445 +[2026-01-29T22:20:18.760852Z] Loop 2780: Reg: 0.3508, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3635, AllReg: 0.5846, BotRReg: 0.7616, OV: 0.4530, AltV: 0.2449, CorV: 0.7651, TopV: 0.4332, BotRV: 0.0351, AllV: 0.2449 +[2026-01-29T22:20:30.418746Z] Loop 2790: Reg: 0.3511, AltReg: 0.5852, CorReg: 0.0000, TopReg: 0.3624, AllReg: 0.5852, BotRReg: 0.7625, OV: 0.4527, AltV: 0.2444, CorV: 0.7651, TopV: 0.4343, BotRV: 0.0342, AllV: 0.2444 +[2026-01-29T22:20:42.077888Z] Loop 2800: Reg: 0.3527, AltReg: 0.5877, CorReg: 0.0001, TopReg: 0.3620, AllReg: 0.5877, BotRReg: 0.7634, OV: 0.4511, AltV: 0.2418, CorV: 0.7650, TopV: 0.4347, BotRV: 0.0333, AllV: 0.2418 +[2026-01-29T22:20:53.742140Z] Loop 2810: Reg: 0.3508, AltReg: 0.5847, CorReg: 0.0000, TopReg: 0.3644, AllReg: 0.5847, BotRReg: 0.7616, OV: 0.4529, AltV: 0.2448, CorV: 0.7651, TopV: 0.4323, BotRV: 0.0350, AllV: 0.2448 +[2026-01-29T22:21:05.395092Z] Loop 2820: Reg: 0.3507, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3643, AllReg: 0.5846, BotRReg: 0.7609, OV: 0.4530, AltV: 0.2450, CorV: 0.7651, TopV: 0.4324, BotRV: 0.0357, AllV: 0.2450 +[2026-01-29T22:21:17.064243Z] Loop 2830: Reg: 0.3508, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3659, AllReg: 0.5846, BotRReg: 0.7604, OV: 0.4530, AltV: 0.2449, CorV: 0.7651, TopV: 0.4308, BotRV: 0.0363, AllV: 0.2449 +[2026-01-29T22:21:28.730446Z] Loop 2840: Reg: 0.3518, AltReg: 0.5863, CorReg: 0.0000, TopReg: 0.3767, AllReg: 0.5863, BotRReg: 0.7587, OV: 0.4520, AltV: 0.2433, CorV: 0.7651, TopV: 0.4200, BotRV: 0.0380, AllV: 0.2433 +[2026-01-29T22:21:40.393225Z] Loop 2850: Reg: 0.3538, AltReg: 0.5886, CorReg: 0.0017, TopReg: 0.3943, AllReg: 0.5886, BotRReg: 0.7586, OV: 0.4499, AltV: 0.2410, CorV: 0.7634, TopV: 0.4024, BotRV: 0.0381, AllV: 0.2410 +[2026-01-29T22:21:52.054259Z] Loop 2860: Reg: 0.3509, AltReg: 0.5848, CorReg: 0.0000, TopReg: 0.3673, AllReg: 0.5848, BotRReg: 0.7598, OV: 0.4529, AltV: 0.2448, CorV: 0.7651, TopV: 0.4294, BotRV: 0.0369, AllV: 0.2448 +[2026-01-29T22:22:03.718166Z] Loop 2870: Reg: 0.3507, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3627, AllReg: 0.5846, BotRReg: 0.7610, OV: 0.4530, AltV: 0.2450, CorV: 0.7651, TopV: 0.4340, BotRV: 0.0357, AllV: 0.2450 +[2026-01-29T22:22:15.363207Z] Loop 2880: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3645, AllReg: 0.5845, BotRReg: 0.7603, OV: 0.4530, AltV: 0.2450, CorV: 0.7651, TopV: 0.4322, BotRV: 0.0364, AllV: 0.2450 +[2026-01-29T22:22:27.018783Z] Loop 2890: Reg: 0.3514, AltReg: 0.5856, CorReg: 0.0000, TopReg: 0.3749, AllReg: 0.5856, BotRReg: 0.7592, OV: 0.4524, AltV: 0.2440, CorV: 0.7651, TopV: 0.4218, BotRV: 0.0375, AllV: 0.2440 +[2026-01-29T22:22:38.685163Z] Loop 2900: Reg: 0.3511, AltReg: 0.5851, CorReg: 0.0000, TopReg: 0.3706, AllReg: 0.5851, BotRReg: 0.7595, OV: 0.4527, AltV: 0.2445, CorV: 0.7651, TopV: 0.4261, BotRV: 0.0372, AllV: 0.2445 +[2026-01-29T22:22:50.351823Z] Loop 2910: Reg: 0.3508, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3659, AllReg: 0.5846, BotRReg: 0.7599, OV: 0.4530, AltV: 0.2449, CorV: 0.7651, TopV: 0.4308, BotRV: 0.0368, AllV: 0.2449 +[2026-01-29T22:23:02.019975Z] Loop 2920: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3628, AllReg: 0.5845, BotRReg: 0.7609, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4339, BotRV: 0.0358, AllV: 0.2451 +[2026-01-29T22:23:13.681843Z] Loop 2930: Reg: 0.3523, AltReg: 0.5871, CorReg: 0.0001, TopReg: 0.3620, AllReg: 0.5871, BotRReg: 0.7633, OV: 0.4515, AltV: 0.2425, CorV: 0.7650, TopV: 0.4347, BotRV: 0.0334, AllV: 0.2425 +[2026-01-29T22:23:25.343752Z] Loop 2940: Reg: 0.3565, AltReg: 0.5940, CorReg: 0.0001, TopReg: 0.3620, AllReg: 0.5940, BotRReg: 0.7654, OV: 0.4473, AltV: 0.2355, CorV: 0.7650, TopV: 0.4347, BotRV: 0.0312, AllV: 0.2355 +[2026-01-29T22:23:37.003294Z] Loop 2950: Reg: 0.3511, AltReg: 0.5851, CorReg: 0.0000, TopReg: 0.3661, AllReg: 0.5851, BotRReg: 0.7623, OV: 0.4527, AltV: 0.2444, CorV: 0.7651, TopV: 0.4306, BotRV: 0.0344, AllV: 0.2444 +[2026-01-29T22:23:48.661001Z] Loop 2960: Reg: 0.3514, AltReg: 0.5856, CorReg: 0.0000, TopReg: 0.3667, AllReg: 0.5856, BotRReg: 0.7624, OV: 0.4524, AltV: 0.2439, CorV: 0.7651, TopV: 0.4300, BotRV: 0.0343, AllV: 0.2439 +[2026-01-29T22:24:00.322440Z] Loop 2970: Reg: 0.3512, AltReg: 0.5853, CorReg: 0.0000, TopReg: 0.3686, AllReg: 0.5853, BotRReg: 0.7623, OV: 0.4526, AltV: 0.2442, CorV: 0.7651, TopV: 0.4281, BotRV: 0.0344, AllV: 0.2442 +[2026-01-29T22:24:11.992165Z] Loop 2980: Reg: 0.3511, AltReg: 0.5852, CorReg: 0.0000, TopReg: 0.3687, AllReg: 0.5852, BotRReg: 0.7621, OV: 0.4527, AltV: 0.2444, CorV: 0.7651, TopV: 0.4280, BotRV: 0.0346, AllV: 0.2444 +[2026-01-29T22:24:23.651976Z] Loop 2990: Reg: 0.3511, AltReg: 0.5852, CorReg: 0.0000, TopReg: 0.3696, AllReg: 0.5852, BotRReg: 0.7597, OV: 0.4527, AltV: 0.2444, CorV: 0.7651, TopV: 0.4271, BotRV: 0.0370, AllV: 0.2444 +[2026-01-29T22:24:35.305044Z] Loop 3000: Reg: 0.3530, AltReg: 0.5883, CorReg: 0.0000, TopReg: 0.3879, AllReg: 0.5883, BotRReg: 0.7586, OV: 0.4508, AltV: 0.2412, CorV: 0.7651, TopV: 0.4088, BotRV: 0.0381, AllV: 0.2412 +[2026-01-29T22:24:46.958369Z] Loop 3010: Reg: 0.3530, AltReg: 0.5880, CorReg: 0.0004, TopReg: 0.3883, AllReg: 0.5880, BotRReg: 0.7586, OV: 0.4508, AltV: 0.2415, CorV: 0.7647, TopV: 0.4084, BotRV: 0.0380, AllV: 0.2415 +[2026-01-29T22:24:58.641699Z] Loop 3020: Reg: 0.3520, AltReg: 0.5863, CorReg: 0.0006, TopReg: 0.3794, AllReg: 0.5863, BotRReg: 0.7594, OV: 0.4518, AltV: 0.2433, CorV: 0.7645, TopV: 0.4173, BotRV: 0.0373, AllV: 0.2433 +[2026-01-29T22:25:10.302092Z] Loop 3030: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3651, AllReg: 0.5845, BotRReg: 0.7600, OV: 0.4531, AltV: 0.2450, CorV: 0.7651, TopV: 0.4315, BotRV: 0.0367, AllV: 0.2450 +[2026-01-29T22:25:21.955171Z] Loop 3040: Reg: 0.3507, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3626, AllReg: 0.5844, BotRReg: 0.7607, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4341, BotRV: 0.0359, AllV: 0.2451 +[2026-01-29T22:25:33.616083Z] Loop 3050: Reg: 0.3507, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3624, AllReg: 0.5844, BotRReg: 0.7609, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4343, BotRV: 0.0358, AllV: 0.2451 +[2026-01-29T22:25:45.271301Z] Loop 3060: Reg: 0.3506, AltReg: 0.5843, CorReg: 0.0000, TopReg: 0.3630, AllReg: 0.5843, BotRReg: 0.7604, OV: 0.4532, AltV: 0.2452, CorV: 0.7651, TopV: 0.4337, BotRV: 0.0363, AllV: 0.2452 +[2026-01-29T22:25:56.935342Z] Loop 3070: Reg: 0.3506, AltReg: 0.5843, CorReg: 0.0000, TopReg: 0.3632, AllReg: 0.5843, BotRReg: 0.7603, OV: 0.4532, AltV: 0.2452, CorV: 0.7651, TopV: 0.4335, BotRV: 0.0364, AllV: 0.2452 +[2026-01-29T22:26:08.593429Z] Loop 3080: Reg: 0.3513, AltReg: 0.5854, CorReg: 0.0001, TopReg: 0.3742, AllReg: 0.5854, BotRReg: 0.7595, OV: 0.4525, AltV: 0.2441, CorV: 0.7650, TopV: 0.4225, BotRV: 0.0372, AllV: 0.2441 +[2026-01-29T22:26:20.248187Z] Loop 3090: Reg: 0.3548, AltReg: 0.5894, CorReg: 0.0029, TopReg: 0.4086, AllReg: 0.5894, BotRReg: 0.7589, OV: 0.4490, AltV: 0.2401, CorV: 0.7623, TopV: 0.3881, BotRV: 0.0378, AllV: 0.2401 +[2026-01-29T22:26:31.902758Z] Loop 3100: Reg: 0.3517, AltReg: 0.5862, CorReg: 0.0001, TopReg: 0.3819, AllReg: 0.5862, BotRReg: 0.7593, OV: 0.4520, AltV: 0.2434, CorV: 0.7650, TopV: 0.4148, BotRV: 0.0374, AllV: 0.2434 +[2026-01-29T22:26:43.567429Z] Loop 3110: Reg: 0.3554, AltReg: 0.5919, CorReg: 0.0007, TopReg: 0.4358, AllReg: 0.5919, BotRReg: 0.7588, OV: 0.4484, AltV: 0.2376, CorV: 0.7645, TopV: 0.3609, BotRV: 0.0379, AllV: 0.2376 +[2026-01-29T22:26:55.233919Z] Loop 3120: Reg: 0.3526, AltReg: 0.5876, CorReg: 0.0001, TopReg: 0.3965, AllReg: 0.5876, BotRReg: 0.7593, OV: 0.4512, AltV: 0.2420, CorV: 0.7650, TopV: 0.4002, BotRV: 0.0374, AllV: 0.2420 +[2026-01-29T22:27:06.895042Z] Loop 3130: Reg: 0.3508, AltReg: 0.5847, CorReg: 0.0000, TopReg: 0.3671, AllReg: 0.5847, BotRReg: 0.7599, OV: 0.4529, AltV: 0.2448, CorV: 0.7651, TopV: 0.4296, BotRV: 0.0368, AllV: 0.2448 +[2026-01-29T22:27:18.558200Z] Loop 3140: Reg: 0.3508, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3622, AllReg: 0.5846, BotRReg: 0.7614, OV: 0.4530, AltV: 0.2449, CorV: 0.7651, TopV: 0.4345, BotRV: 0.0353, AllV: 0.2449 +[2026-01-29T22:27:30.219174Z] Loop 3150: Reg: 0.3508, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3623, AllReg: 0.5846, BotRReg: 0.7615, OV: 0.4530, AltV: 0.2449, CorV: 0.7651, TopV: 0.4344, BotRV: 0.0352, AllV: 0.2449 +[2026-01-29T22:27:41.883479Z] Loop 3160: Reg: 0.3507, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3632, AllReg: 0.5844, BotRReg: 0.7610, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4335, BotRV: 0.0357, AllV: 0.2451 +[2026-01-29T22:27:53.548076Z] Loop 3170: Reg: 0.3507, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3629, AllReg: 0.5844, BotRReg: 0.7611, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4338, BotRV: 0.0356, AllV: 0.2451 +[2026-01-29T22:28:05.209911Z] Loop 3180: Reg: 0.3507, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3649, AllReg: 0.5846, BotRReg: 0.7607, OV: 0.4530, AltV: 0.2450, CorV: 0.7651, TopV: 0.4318, BotRV: 0.0360, AllV: 0.2450 +[2026-01-29T22:28:16.872729Z] Loop 3190: Reg: 0.3511, AltReg: 0.5852, CorReg: 0.0000, TopReg: 0.3718, AllReg: 0.5852, BotRReg: 0.7596, OV: 0.4526, AltV: 0.2443, CorV: 0.7651, TopV: 0.4248, BotRV: 0.0371, AllV: 0.2443 +[2026-01-29T22:28:28.539560Z] Loop 3200: Reg: 0.3508, AltReg: 0.5847, CorReg: 0.0000, TopReg: 0.3668, AllReg: 0.5847, BotRReg: 0.7599, OV: 0.4530, AltV: 0.2449, CorV: 0.7651, TopV: 0.4298, BotRV: 0.0367, AllV: 0.2449 +[2026-01-29T22:28:40.201419Z] Loop 3210: Reg: 0.3507, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3624, AllReg: 0.5844, BotRReg: 0.7610, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4343, BotRV: 0.0357, AllV: 0.2451 +[2026-01-29T22:28:51.869109Z] Loop 3220: Reg: 0.3507, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3627, AllReg: 0.5844, BotRReg: 0.7608, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4340, BotRV: 0.0358, AllV: 0.2451 +[2026-01-29T22:29:03.528511Z] Loop 3230: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3624, AllReg: 0.5845, BotRReg: 0.7611, OV: 0.4531, AltV: 0.2450, CorV: 0.7651, TopV: 0.4343, BotRV: 0.0356, AllV: 0.2450 +[2026-01-29T22:29:15.192717Z] Loop 3240: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3640, AllReg: 0.5845, BotRReg: 0.7603, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4327, BotRV: 0.0364, AllV: 0.2451 +[2026-01-29T22:29:26.857961Z] Loop 3250: Reg: 0.3510, AltReg: 0.5850, CorReg: 0.0000, TopReg: 0.3700, AllReg: 0.5850, BotRReg: 0.7597, OV: 0.4528, AltV: 0.2446, CorV: 0.7651, TopV: 0.4267, BotRV: 0.0370, AllV: 0.2446 +[2026-01-29T22:29:38.520200Z] Loop 3260: Reg: 0.3511, AltReg: 0.5852, CorReg: 0.0000, TopReg: 0.3715, AllReg: 0.5852, BotRReg: 0.7597, OV: 0.4527, AltV: 0.2444, CorV: 0.7651, TopV: 0.4252, BotRV: 0.0370, AllV: 0.2444 +[2026-01-29T22:29:50.174948Z] Loop 3270: Reg: 0.3508, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3660, AllReg: 0.5846, BotRReg: 0.7599, OV: 0.4530, AltV: 0.2449, CorV: 0.7651, TopV: 0.4307, BotRV: 0.0367, AllV: 0.2449 +[2026-01-29T22:30:01.829192Z] Loop 3280: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3649, AllReg: 0.5845, BotRReg: 0.7601, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4318, BotRV: 0.0366, AllV: 0.2451 +[2026-01-29T22:30:13.491819Z] Loop 3290: Reg: 0.3506, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3630, AllReg: 0.5844, BotRReg: 0.7606, OV: 0.4531, AltV: 0.2452, CorV: 0.7651, TopV: 0.4337, BotRV: 0.0361, AllV: 0.2452 +[2026-01-29T22:30:25.156659Z] Loop 3300: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3622, AllReg: 0.5845, BotRReg: 0.7611, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4345, BotRV: 0.0356, AllV: 0.2451 +[2026-01-29T22:30:36.817494Z] Loop 3310: Reg: 0.3617, AltReg: 0.5997, CorReg: 0.0046, TopReg: 0.3678, AllReg: 0.5997, BotRReg: 0.7676, OV: 0.4421, AltV: 0.2298, CorV: 0.7605, TopV: 0.4289, BotRV: 0.0290, AllV: 0.2298 +[2026-01-29T22:30:48.485063Z] Loop 3320: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3634, AllReg: 0.5845, BotRReg: 0.7609, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4333, BotRV: 0.0358, AllV: 0.2451 +[2026-01-29T22:31:00.157505Z] Loop 3330: Reg: 0.3511, AltReg: 0.5851, CorReg: 0.0000, TopReg: 0.3698, AllReg: 0.5851, BotRReg: 0.7598, OV: 0.4527, AltV: 0.2444, CorV: 0.7651, TopV: 0.4269, BotRV: 0.0369, AllV: 0.2444 +[2026-01-29T22:31:11.822697Z] Loop 3340: Reg: 0.3521, AltReg: 0.5868, CorReg: 0.0000, TopReg: 0.3674, AllReg: 0.5868, BotRReg: 0.7629, OV: 0.4517, AltV: 0.2428, CorV: 0.7651, TopV: 0.4293, BotRV: 0.0338, AllV: 0.2428 +[2026-01-29T22:31:23.480888Z] Loop 3350: Reg: 0.3510, AltReg: 0.5849, CorReg: 0.0000, TopReg: 0.3686, AllReg: 0.5849, BotRReg: 0.7607, OV: 0.4528, AltV: 0.2446, CorV: 0.7651, TopV: 0.4281, BotRV: 0.0360, AllV: 0.2446 +[2026-01-29T22:31:35.149139Z] Loop 3360: Reg: 0.3518, AltReg: 0.5864, CorReg: 0.0000, TopReg: 0.3796, AllReg: 0.5864, BotRReg: 0.7587, OV: 0.4519, AltV: 0.2432, CorV: 0.7651, TopV: 0.4171, BotRV: 0.0379, AllV: 0.2432 +[2026-01-29T22:31:46.826165Z] Loop 3370: Reg: 0.3522, AltReg: 0.5870, CorReg: 0.0000, TopReg: 0.3861, AllReg: 0.5870, BotRReg: 0.7587, OV: 0.4516, AltV: 0.2425, CorV: 0.7651, TopV: 0.4106, BotRV: 0.0380, AllV: 0.2425 +[2026-01-29T22:31:58.502529Z] Loop 3380: Reg: 0.3510, AltReg: 0.5849, CorReg: 0.0000, TopReg: 0.3699, AllReg: 0.5849, BotRReg: 0.7597, OV: 0.4528, AltV: 0.2446, CorV: 0.7651, TopV: 0.4268, BotRV: 0.0370, AllV: 0.2446 +[2026-01-29T22:32:10.159734Z] Loop 3390: Reg: 0.3506, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3644, AllReg: 0.5844, BotRReg: 0.7601, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4323, BotRV: 0.0366, AllV: 0.2451 +[2026-01-29T22:32:21.829471Z] Loop 3400: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3651, AllReg: 0.5845, BotRReg: 0.7599, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4316, BotRV: 0.0368, AllV: 0.2451 +[2026-01-29T22:32:33.499908Z] Loop 3410: Reg: 0.3506, AltReg: 0.5843, CorReg: 0.0000, TopReg: 0.3634, AllReg: 0.5843, BotRReg: 0.7602, OV: 0.4532, AltV: 0.2452, CorV: 0.7651, TopV: 0.4333, BotRV: 0.0365, AllV: 0.2452 +[2026-01-29T22:32:45.163027Z] Loop 3420: Reg: 0.3509, AltReg: 0.5848, CorReg: 0.0000, TopReg: 0.3687, AllReg: 0.5848, BotRReg: 0.7598, OV: 0.4529, AltV: 0.2448, CorV: 0.7651, TopV: 0.4279, BotRV: 0.0369, AllV: 0.2448 +[2026-01-29T22:32:56.828016Z] Loop 3430: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3659, AllReg: 0.5845, BotRReg: 0.7599, OV: 0.4530, AltV: 0.2450, CorV: 0.7651, TopV: 0.4307, BotRV: 0.0368, AllV: 0.2450 +[2026-01-29T22:33:08.494379Z] Loop 3440: Reg: 0.3506, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3640, AllReg: 0.5844, BotRReg: 0.7600, OV: 0.4532, AltV: 0.2452, CorV: 0.7651, TopV: 0.4327, BotRV: 0.0367, AllV: 0.2452 +[2026-01-29T22:33:20.178160Z] Loop 3450: Reg: 0.3506, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3643, AllReg: 0.5844, BotRReg: 0.7599, OV: 0.4531, AltV: 0.2452, CorV: 0.7651, TopV: 0.4324, BotRV: 0.0368, AllV: 0.2452 +[2026-01-29T22:33:31.851336Z] Loop 3460: Reg: 0.3506, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3646, AllReg: 0.5844, BotRReg: 0.7599, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4321, BotRV: 0.0368, AllV: 0.2451 +[2026-01-29T22:33:43.519698Z] Loop 3470: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3655, AllReg: 0.5845, BotRReg: 0.7598, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4312, BotRV: 0.0369, AllV: 0.2451 +[2026-01-29T22:33:55.192534Z] Loop 3480: Reg: 0.3506, AltReg: 0.5843, CorReg: 0.0000, TopReg: 0.3623, AllReg: 0.5843, BotRReg: 0.7607, OV: 0.4532, AltV: 0.2453, CorV: 0.7651, TopV: 0.4344, BotRV: 0.0360, AllV: 0.2453 +[2026-01-29T22:34:06.850746Z] Loop 3490: Reg: 0.3507, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3620, AllReg: 0.5844, BotRReg: 0.7611, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4347, BotRV: 0.0356, AllV: 0.2451 +[2026-01-29T22:34:18.506037Z] Loop 3500: Reg: 0.3515, AltReg: 0.5858, CorReg: 0.0000, TopReg: 0.3620, AllReg: 0.5858, BotRReg: 0.7630, OV: 0.4523, AltV: 0.2437, CorV: 0.7651, TopV: 0.4347, BotRV: 0.0337, AllV: 0.2437 +[2026-01-29T22:34:30.170113Z] Loop 3510: Reg: 0.3508, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3624, AllReg: 0.5846, BotRReg: 0.7612, OV: 0.4530, AltV: 0.2449, CorV: 0.7651, TopV: 0.4342, BotRV: 0.0355, AllV: 0.2449 +[2026-01-29T22:34:41.831143Z] Loop 3520: Reg: 0.3512, AltReg: 0.5853, CorReg: 0.0000, TopReg: 0.3659, AllReg: 0.5853, BotRReg: 0.7610, OV: 0.4526, AltV: 0.2442, CorV: 0.7651, TopV: 0.4308, BotRV: 0.0357, AllV: 0.2442 +[2026-01-29T22:34:53.500891Z] Loop 3530: Reg: 0.3513, AltReg: 0.5854, CorReg: 0.0000, TopReg: 0.3645, AllReg: 0.5854, BotRReg: 0.7619, OV: 0.4525, AltV: 0.2441, CorV: 0.7651, TopV: 0.4321, BotRV: 0.0347, AllV: 0.2441 +[2026-01-29T22:35:05.171719Z] Loop 3540: Reg: 0.3517, AltReg: 0.5861, CorReg: 0.0000, TopReg: 0.3630, AllReg: 0.5861, BotRReg: 0.7627, OV: 0.4521, AltV: 0.2434, CorV: 0.7651, TopV: 0.4337, BotRV: 0.0340, AllV: 0.2434 +[2026-01-29T22:35:16.833900Z] Loop 3550: Reg: 0.3508, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3648, AllReg: 0.5846, BotRReg: 0.7614, OV: 0.4530, AltV: 0.2449, CorV: 0.7651, TopV: 0.4319, BotRV: 0.0353, AllV: 0.2449 +[2026-01-29T22:35:28.495969Z] Loop 3560: Reg: 0.3509, AltReg: 0.5848, CorReg: 0.0000, TopReg: 0.3627, AllReg: 0.5848, BotRReg: 0.7625, OV: 0.4529, AltV: 0.2447, CorV: 0.7651, TopV: 0.4340, BotRV: 0.0342, AllV: 0.2447 +[2026-01-29T22:35:40.163227Z] Loop 3570: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3627, AllReg: 0.5845, BotRReg: 0.7620, OV: 0.4531, AltV: 0.2450, CorV: 0.7651, TopV: 0.4340, BotRV: 0.0347, AllV: 0.2450 +[2026-01-29T22:35:51.824720Z] Loop 3580: Reg: 0.3507, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3629, AllReg: 0.5844, BotRReg: 0.7615, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4338, BotRV: 0.0352, AllV: 0.2451 +[2026-01-29T22:36:03.485117Z] Loop 3590: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3624, AllReg: 0.5845, BotRReg: 0.7622, OV: 0.4531, AltV: 0.2450, CorV: 0.7651, TopV: 0.4343, BotRV: 0.0345, AllV: 0.2450 +[2026-01-29T22:36:15.139895Z] Loop 3600: Reg: 0.3506, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3624, AllReg: 0.5844, BotRReg: 0.7615, OV: 0.4531, AltV: 0.2452, CorV: 0.7651, TopV: 0.4343, BotRV: 0.0352, AllV: 0.2452 +[2026-01-29T22:36:26.807252Z] Loop 3610: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3623, AllReg: 0.5845, BotRReg: 0.7621, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4344, BotRV: 0.0346, AllV: 0.2451 +[2026-01-29T22:36:38.486425Z] Loop 3620: Reg: 0.3557, AltReg: 0.5928, CorReg: 0.0001, TopReg: 0.3629, AllReg: 0.5928, BotRReg: 0.7665, OV: 0.4481, AltV: 0.2368, CorV: 0.7650, TopV: 0.4338, BotRV: 0.0302, AllV: 0.2368 +[2026-01-29T22:36:50.147645Z] Loop 3630: Reg: 0.3522, AltReg: 0.5870, CorReg: 0.0000, TopReg: 0.3619, AllReg: 0.5870, BotRReg: 0.7645, OV: 0.4516, AltV: 0.2425, CorV: 0.7651, TopV: 0.4348, BotRV: 0.0322, AllV: 0.2425 +[2026-01-29T22:37:01.810077Z] Loop 3640: Reg: 0.3508, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3621, AllReg: 0.5846, BotRReg: 0.7623, OV: 0.4530, AltV: 0.2449, CorV: 0.7651, TopV: 0.4346, BotRV: 0.0344, AllV: 0.2449 +[2026-01-29T22:37:13.467923Z] Loop 3650: Reg: 0.3507, AltReg: 0.5846, CorReg: 0.0000, TopReg: 0.3624, AllReg: 0.5846, BotRReg: 0.7623, OV: 0.4530, AltV: 0.2450, CorV: 0.7651, TopV: 0.4343, BotRV: 0.0344, AllV: 0.2450 +[2026-01-29T22:37:25.122900Z] Loop 3660: Reg: 0.3507, AltReg: 0.5845, CorReg: 0.0000, TopReg: 0.3630, AllReg: 0.5845, BotRReg: 0.7620, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4336, BotRV: 0.0347, AllV: 0.2451 +[2026-01-29T22:37:36.777726Z] Loop 3670: Reg: 0.3516, AltReg: 0.5861, CorReg: 0.0000, TopReg: 0.3619, AllReg: 0.5861, BotRReg: 0.7635, OV: 0.4521, AltV: 0.2435, CorV: 0.7651, TopV: 0.4348, BotRV: 0.0332, AllV: 0.2435 +[2026-01-29T22:37:48.432826Z] Loop 3680: Reg: 0.3511, AltReg: 0.5851, CorReg: 0.0000, TopReg: 0.3628, AllReg: 0.5851, BotRReg: 0.7627, OV: 0.4527, AltV: 0.2445, CorV: 0.7651, TopV: 0.4339, BotRV: 0.0340, AllV: 0.2445 +[2026-01-29T22:38:00.089391Z] Loop 3690: Reg: 0.3534, AltReg: 0.5890, CorReg: 0.0000, TopReg: 0.3620, AllReg: 0.5890, BotRReg: 0.7644, OV: 0.4504, AltV: 0.2405, CorV: 0.7651, TopV: 0.4347, BotRV: 0.0323, AllV: 0.2405 +[2026-01-29T22:38:11.752506Z] Loop 3700: Reg: 0.3556, AltReg: 0.5927, CorReg: 0.0000, TopReg: 0.3619, AllReg: 0.5927, BotRReg: 0.7665, OV: 0.4482, AltV: 0.2369, CorV: 0.7651, TopV: 0.4348, BotRV: 0.0302, AllV: 0.2369 +[2026-01-29T22:38:23.403436Z] Loop 3710: Reg: 0.3511, AltReg: 0.5851, CorReg: 0.0000, TopReg: 0.3622, AllReg: 0.5851, BotRReg: 0.7626, OV: 0.4527, AltV: 0.2444, CorV: 0.7651, TopV: 0.4344, BotRV: 0.0341, AllV: 0.2444 +[2026-01-29T22:38:35.061937Z] Loop 3720: Reg: 0.3510, AltReg: 0.5849, CorReg: 0.0000, TopReg: 0.3690, AllReg: 0.5849, BotRReg: 0.7597, OV: 0.4528, AltV: 0.2446, CorV: 0.7651, TopV: 0.4277, BotRV: 0.0369, AllV: 0.2446 +[2026-01-29T22:38:46.720570Z] Loop 3730: Reg: 0.3517, AltReg: 0.5862, CorReg: 0.0000, TopReg: 0.3752, AllReg: 0.5862, BotRReg: 0.7589, OV: 0.4520, AltV: 0.2433, CorV: 0.7651, TopV: 0.4215, BotRV: 0.0378, AllV: 0.2433 +[2026-01-29T22:38:58.392892Z] Loop 3740: Reg: 0.3526, AltReg: 0.5868, CorReg: 0.0012, TopReg: 0.3764, AllReg: 0.5868, BotRReg: 0.7590, OV: 0.4512, AltV: 0.2427, CorV: 0.7639, TopV: 0.4203, BotRV: 0.0377, AllV: 0.2427 +[2026-01-29T22:39:10.059180Z] Loop 3750: Reg: 0.3510, AltReg: 0.5849, CorReg: 0.0000, TopReg: 0.3695, AllReg: 0.5849, BotRReg: 0.7597, OV: 0.4528, AltV: 0.2446, CorV: 0.7651, TopV: 0.4272, BotRV: 0.0370, AllV: 0.2446 +[2026-01-29T22:39:21.719105Z] Loop 3760: Reg: 0.3507, AltReg: 0.5844, CorReg: 0.0000, TopReg: 0.3645, AllReg: 0.5844, BotRReg: 0.7599, OV: 0.4531, AltV: 0.2451, CorV: 0.7651, TopV: 0.4321, BotRV: 0.0368, AllV: 0.2451 diff --git a/al_0.6_g_0.97_id_11_seed_970611/latest_train.json b/al_0.6_g_0.97_id_11_seed_970611/latest_train.json new file mode 100644 index 0000000000000000000000000000000000000000..163949bf9133066dadb855462d46bc58054d5c23 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/latest_train.json @@ -0,0 +1,12 @@ +{ + "ts": "2026-01-29T22:39:34.575946Z", + "loop": 3771, + "env_steps": 2317516799, + "loss": 0.0012540643801912665, + "avg_return": 0.45758190751075745, + "regret": 0.35057640075683594, + "entropy": 0.06041354313492775, + "lr": 5e-05, + "discount_rate": 0.97, + "num_rollout_steps": 64 +} \ No newline at end of file diff --git a/al_0.6_g_0.97_id_11_seed_970611/setup.json b/al_0.6_g_0.97_id_11_seed_970611/setup.json new file mode 100644 index 0000000000000000000000000000000000000000..1d64c04ae3b107b9c54121559952b80a2a6de976 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/setup.json @@ -0,0 +1,86 @@ +{ + "config": { + "rl_action": "train", + "num_rollout_steps": 64, + "lr": 5e-05, + "discount_rate": 0.97, + "eff_horizon": null, + "eval_every": 1, + "use_wandb": true, + "use_hf": true, + "use_log": true, + "num_total_env_steps": 10000000000, + "checkpoint": "al_0.6_g_0.97_id_11_seed_970611", + "render_sixel": false, + "sixel_idx": 60, + "seed": 970611, + "run_id": 11, + "seed_formula": "{int(discount_rate*100):02d}{int(alpha*10):02d}{run_id:02d}", + "mask_type": "first_episode", + "penalize_time": false, + "optim": "adam", + "live_monitor": false, + "use_bf16": false, + "deterministic": true, + "eval_schedule": "0:1,250:2,500:5,2000:10", + "grad_acc_per_chunk": 5, + "num_rollout_chunks": 1, + "cheese_loc": "any", + "env_rule": null, + "env_layout": "open", + "alpha": 0.6, + "env_size": 13, + "num_levels": 9600, + "f_str_ckpt": "al_{alpha}_g_{discount_rate}_id_{run_id}_seed_{seed}", + "wandb_project": "jaxgmg2_3phase_unique", + "ckpt_dir": "jaxgmg2_3phase_unique", + "duplication_factor": -1, + "smoke": false, + "compile": true, + "num_chains": 6, + "num_draws": 3000, + "num_steps_bw_draws": 1, + "on_policy": true, + "llc_nbeta": 3000, + "localization": 10, + "exact_solver_each_draw": false, + "llc_optimizer": "sgld", + "iw_clip_eps": null, + "rmsprop_burnin_steps": 20, + "llc_data_file": "llc_scan_open_reinforce.pkl", + "llc_checkpoint_index": null, + "llc_checkpoint_number": null, + "sink": null, + "repo_id": "davidquarel/jaxgmg_ckpt_zip", + "use_shuffled_checkpoints": false, + "force_re_download": false, + "off_distribution_data": false, + "weight_restrictions": null, + "weight_restrictions_invert": false, + "evaluate_every_position": false, + "num_prev_actions": 1, + "ntfy": "david_jaxgmg", + "vis_average_state": false, + "trim_episodes": true, + "use_prev_action": false, + "ckpt_path": "jaxgmg2_3phase_unique/al_0.6_g_0.97_id_11_seed_970611", + "env_steps_per_loop": 614400, + "total_loops": 16276, + "eff_acc_steps": 5, + "env_steps_per_microbatch": 122880, + "chunk_size": 9600 + }, + "setup": { + "start_time_utc": "2026-01-29T21:25:28.015170Z", + "seed": 970611, + "device": "cuda", + "python_version": "3.11.11", + "torch_version": "2.10.0+cu128", + "jax_version": "0.6.2", + "hostname": "24587d833a07", + "platform": "Linux-6.8.0-90-generic-x86_64-with-glibc2.35", + "git_sha": null, + "git_branch": null, + "use_wandb": true + } +} \ No newline at end of file diff --git a/al_0.6_g_0.97_id_11_seed_970611/setup.txt b/al_0.6_g_0.97_id_11_seed_970611/setup.txt new file mode 100644 index 0000000000000000000000000000000000000000..8a8fbf72bba3399ea592da901fe1e4c51194ee7c --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/setup.txt @@ -0,0 +1,8 @@ +Start: 2026-01-29T21:25:28.015170Z +Seed: 970611 +Device: cuda +Python: 3.11.11 | Torch: 2.10.0+cu128 | JAX: 0.6.2 +Host: 24587d833a07 +Platform: Linux-6.8.0-90-generic-x86_64-with-glibc2.35 +Git: branch=None sha=None +use_wandb: True diff --git a/al_0.6_g_0.97_id_11_seed_970611/train.jsonl b/al_0.6_g_0.97_id_11_seed_970611/train.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3caf6e755d7c43d8e42c015e3cedc96ead2ad0da --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/train.jsonl @@ -0,0 +1,3769 @@ +{"ts": "2026-01-29T21:25:57.840988Z", "loop": 0, "env_steps": 614399, "loss": 0.014129042625427246, "avg_return": 0.08706724643707275, "regret": 0.7079524993896484, "entropy": 1.3862768411636353, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:25:59.054150Z", "loop": 1, "env_steps": 1228799, "loss": 0.014178085140883923, "avg_return": 0.08504888415336609, "regret": 0.707631528377533, "entropy": 1.3862823247909546, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:00.265894Z", "loop": 2, "env_steps": 1843199, "loss": 0.013395698741078377, "avg_return": 0.08465930819511414, "regret": 0.7073216438293457, "entropy": 1.3862849473953247, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:01.473350Z", "loop": 3, "env_steps": 2457599, "loss": 0.014351661317050457, "avg_return": 0.09428062289953232, "regret": 0.7070201635360718, "entropy": 1.3862844705581665, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:02.676328Z", "loop": 4, "env_steps": 3071999, "loss": 0.014082716777920723, "avg_return": 0.08933772891759872, "regret": 0.7067158222198486, "entropy": 1.3862812519073486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:03.880329Z", "loop": 5, "env_steps": 3686399, "loss": 0.014080457389354706, "avg_return": 0.09066937863826752, "regret": 0.7064108848571777, "entropy": 1.3862755298614502, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:05.094812Z", "loop": 6, "env_steps": 4300799, "loss": 0.014788617379963398, "avg_return": 0.08879382163286209, "regret": 0.7061117887496948, "entropy": 1.3862669467926025, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:06.310786Z", "loop": 7, "env_steps": 4915199, "loss": 0.013912667520344257, "avg_return": 0.08961869776248932, "regret": 0.7058216333389282, "entropy": 1.386256456375122, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:07.521493Z", "loop": 8, "env_steps": 5529599, "loss": 0.015655381605029106, "avg_return": 0.08949364721775055, "regret": 0.7055338621139526, "entropy": 1.3862435817718506, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:08.724719Z", "loop": 9, "env_steps": 6143999, "loss": 0.016463426873087883, "avg_return": 0.09282553941011429, "regret": 0.7052397131919861, "entropy": 1.3862282037734985, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:09.929209Z", "loop": 10, "env_steps": 6758399, "loss": 0.016777334734797478, "avg_return": 0.09353379160165787, "regret": 0.7049384117126465, "entropy": 1.3862100839614868, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:11.131732Z", "loop": 11, "env_steps": 7372799, "loss": 0.015137048438191414, "avg_return": 0.09077730029821396, "regret": 0.704624354839325, "entropy": 1.3861887454986572, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:12.339013Z", "loop": 12, "env_steps": 7987199, "loss": 0.013955304399132729, "avg_return": 0.08853396028280258, "regret": 0.7042970061302185, "entropy": 1.3861639499664307, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:13.548955Z", "loop": 13, "env_steps": 8601599, "loss": 0.014399188570678234, "avg_return": 0.09315143525600433, "regret": 0.7039568424224854, "entropy": 1.3861356973648071, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:14.757499Z", "loop": 14, "env_steps": 9215999, "loss": 0.01616486720740795, "avg_return": 0.09348779171705246, "regret": 0.7036070823669434, "entropy": 1.3861035108566284, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:15.962940Z", "loop": 15, "env_steps": 9830399, "loss": 0.015051953494548798, "avg_return": 0.09202273935079575, "regret": 0.7032424211502075, "entropy": 1.3860671520233154, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:17.165342Z", "loop": 16, "env_steps": 10444799, "loss": 0.014127626083791256, "avg_return": 0.08952413499355316, "regret": 0.7028632760047913, "entropy": 1.3860257863998413, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:18.373136Z", "loop": 17, "env_steps": 11059199, "loss": 0.016016768291592598, "avg_return": 0.093620166182518, "regret": 0.7024667263031006, "entropy": 1.3859790563583374, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:19.578404Z", "loop": 18, "env_steps": 11673599, "loss": 0.015074721537530422, "avg_return": 0.09134333580732346, "regret": 0.7020548582077026, "entropy": 1.385927438735962, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:20.783615Z", "loop": 19, "env_steps": 12287999, "loss": 0.01540676411241293, "avg_return": 0.08851701021194458, "regret": 0.7016264200210571, "entropy": 1.3858686685562134, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:21.993224Z", "loop": 20, "env_steps": 12902399, "loss": 0.014999672770500183, "avg_return": 0.09290270507335663, "regret": 0.7011767625808716, "entropy": 1.385804295539856, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:23.202091Z", "loop": 21, "env_steps": 13516799, "loss": 0.014691263437271118, "avg_return": 0.08776716142892838, "regret": 0.7007043361663818, "entropy": 1.3857321739196777, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:24.409810Z", "loop": 22, "env_steps": 14131199, "loss": 0.014913985505700111, "avg_return": 0.09668470919132233, "regret": 0.7002131938934326, "entropy": 1.385652780532837, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:25.612713Z", "loop": 23, "env_steps": 14745599, "loss": 0.015793006867170334, "avg_return": 0.0924314334988594, "regret": 0.6996974349021912, "entropy": 1.3855652809143066, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:26.815895Z", "loop": 24, "env_steps": 15359999, "loss": 0.01440458931028843, "avg_return": 0.09308800101280212, "regret": 0.6991506814956665, "entropy": 1.3854663372039795, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:28.017873Z", "loop": 25, "env_steps": 15974399, "loss": 0.01610620878636837, "avg_return": 0.09800080955028534, "regret": 0.6985790729522705, "entropy": 1.385358214378357, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:29.217839Z", "loop": 26, "env_steps": 16588799, "loss": 0.016004731878638268, "avg_return": 0.0978103056550026, "regret": 0.6979695558547974, "entropy": 1.3852362632751465, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:30.427831Z", "loop": 27, "env_steps": 17203199, "loss": 0.016060620546340942, "avg_return": 0.09821394830942154, "regret": 0.697311282157898, "entropy": 1.3850985765457153, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:31.630408Z", "loop": 28, "env_steps": 17817599, "loss": 0.017175430431962013, "avg_return": 0.09233951568603516, "regret": 0.6966090202331543, "entropy": 1.3849434852600098, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:32.832097Z", "loop": 29, "env_steps": 18431999, "loss": 0.01686941273510456, "avg_return": 0.09658286720514297, "regret": 0.6958577036857605, "entropy": 1.3847700357437134, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:34.038186Z", "loop": 30, "env_steps": 19046399, "loss": 0.01836623065173626, "avg_return": 0.09599792957305908, "regret": 0.6950529217720032, "entropy": 1.3845726251602173, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:35.242256Z", "loop": 31, "env_steps": 19660799, "loss": 0.017365925014019012, "avg_return": 0.09707308560609818, "regret": 0.6941866874694824, "entropy": 1.3843517303466797, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:36.447404Z", "loop": 32, "env_steps": 20275199, "loss": 0.016309401020407677, "avg_return": 0.09855113923549652, "regret": 0.6932559013366699, "entropy": 1.384103775024414, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:37.651271Z", "loop": 33, "env_steps": 20889599, "loss": 0.01806154102087021, "avg_return": 0.09707745164632797, "regret": 0.6922589540481567, "entropy": 1.3838242292404175, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:38.853158Z", "loop": 34, "env_steps": 21503999, "loss": 0.017249232158064842, "avg_return": 0.10137561708688736, "regret": 0.6911920309066772, "entropy": 1.3835129737854004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:40.056461Z", "loop": 35, "env_steps": 22118399, "loss": 0.016624871641397476, "avg_return": 0.1033114492893219, "regret": 0.690089225769043, "entropy": 1.3831756114959717, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:41.261046Z", "loop": 36, "env_steps": 22732799, "loss": 0.019373880699276924, "avg_return": 0.10358206182718277, "regret": 0.6889081001281738, "entropy": 1.3828011751174927, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:42.467552Z", "loop": 37, "env_steps": 23347199, "loss": 0.019947508350014687, "avg_return": 0.1023392379283905, "regret": 0.6876395344734192, "entropy": 1.3823800086975098, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:43.670186Z", "loop": 38, "env_steps": 23961599, "loss": 0.01708204485476017, "avg_return": 0.10440367460250854, "regret": 0.6862614154815674, "entropy": 1.381905198097229, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:44.872976Z", "loop": 39, "env_steps": 24575999, "loss": 0.02107463963329792, "avg_return": 0.10799109190702438, "regret": 0.6847628355026245, "entropy": 1.3813655376434326, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:46.074852Z", "loop": 40, "env_steps": 25190399, "loss": 0.019911400973796844, "avg_return": 0.11038494110107422, "regret": 0.6831387281417847, "entropy": 1.380755066871643, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:47.277221Z", "loop": 41, "env_steps": 25804799, "loss": 0.01891486532986164, "avg_return": 0.10618302971124649, "regret": 0.6813806295394897, "entropy": 1.3800652027130127, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:48.479121Z", "loop": 42, "env_steps": 26419199, "loss": 0.02124996855854988, "avg_return": 0.11119896173477173, "regret": 0.6794573068618774, "entropy": 1.3792715072631836, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:49.681508Z", "loop": 43, "env_steps": 27033599, "loss": 0.02117270976305008, "avg_return": 0.11200742423534393, "regret": 0.6773385405540466, "entropy": 1.3783618211746216, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:50.883412Z", "loop": 44, "env_steps": 27647999, "loss": 0.02220248430967331, "avg_return": 0.11879359185695648, "regret": 0.6750146746635437, "entropy": 1.3773219585418701, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:52.086313Z", "loop": 45, "env_steps": 28262399, "loss": 0.02315388061106205, "avg_return": 0.11865399032831192, "regret": 0.6724823713302612, "entropy": 1.3761389255523682, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:53.288310Z", "loop": 46, "env_steps": 28876799, "loss": 0.022104239091277122, "avg_return": 0.12167048454284668, "regret": 0.669716477394104, "entropy": 1.3747831583023071, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:54.490079Z", "loop": 47, "env_steps": 29491199, "loss": 0.022808564826846123, "avg_return": 0.12313500791788101, "regret": 0.6666913032531738, "entropy": 1.3732339143753052, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:55.694363Z", "loop": 48, "env_steps": 30105599, "loss": 0.024917438626289368, "avg_return": 0.12672165036201477, "regret": 0.6634023189544678, "entropy": 1.3714518547058105, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:56.898257Z", "loop": 49, "env_steps": 30719999, "loss": 0.02508433163166046, "avg_return": 0.1307663768529892, "regret": 0.6598055958747864, "entropy": 1.3694088459014893, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:58.103325Z", "loop": 50, "env_steps": 31334399, "loss": 0.02638906240463257, "avg_return": 0.135484978556633, "regret": 0.6558685302734375, "entropy": 1.3670071363449097, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:26:59.306270Z", "loop": 51, "env_steps": 31948799, "loss": 0.028095874935388565, "avg_return": 0.1382497102022171, "regret": 0.6515657901763916, "entropy": 1.3642584085464478, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:00.507528Z", "loop": 52, "env_steps": 32563199, "loss": 0.02757534384727478, "avg_return": 0.14027170836925507, "regret": 0.646894633769989, "entropy": 1.361070156097412, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:01.708423Z", "loop": 53, "env_steps": 33177599, "loss": 0.029142916202545166, "avg_return": 0.14236560463905334, "regret": 0.6418265700340271, "entropy": 1.357362151145935, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:02.914261Z", "loop": 54, "env_steps": 33791999, "loss": 0.03174120560288429, "avg_return": 0.1513567864894867, "regret": 0.6363353729248047, "entropy": 1.3530349731445312, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:04.117935Z", "loop": 55, "env_steps": 34406399, "loss": 0.033923085778951645, "avg_return": 0.1615358293056488, "regret": 0.6304646730422974, "entropy": 1.3480656147003174, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:05.320335Z", "loop": 56, "env_steps": 35020799, "loss": 0.03460516408085823, "avg_return": 0.16668292880058289, "regret": 0.6242214441299438, "entropy": 1.3422788381576538, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:06.521962Z", "loop": 57, "env_steps": 35635199, "loss": 0.03550935536623001, "avg_return": 0.1751323789358139, "regret": 0.6176434755325317, "entropy": 1.3356022834777832, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:07.725152Z", "loop": 58, "env_steps": 36249599, "loss": 0.04046841338276863, "avg_return": 0.18549494445323944, "regret": 0.6107183694839478, "entropy": 1.3279038667678833, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:08.930186Z", "loop": 59, "env_steps": 36863999, "loss": 0.04001924768090248, "avg_return": 0.1888372153043747, "regret": 0.6035044193267822, "entropy": 1.3189510107040405, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:10.132797Z", "loop": 60, "env_steps": 37478399, "loss": 0.04197883605957031, "avg_return": 0.19644862413406372, "regret": 0.5960818529129028, "entropy": 1.3086650371551514, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:11.335028Z", "loop": 61, "env_steps": 38092799, "loss": 0.043042898178100586, "avg_return": 0.20672988891601562, "regret": 0.5885549783706665, "entropy": 1.2968465089797974, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:12.538352Z", "loop": 62, "env_steps": 38707199, "loss": 0.044028569012880325, "avg_return": 0.21523518860340118, "regret": 0.5809752941131592, "entropy": 1.2834631204605103, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:13.742864Z", "loop": 63, "env_steps": 39321599, "loss": 0.04088978469371796, "avg_return": 0.22607681155204773, "regret": 0.5734766721725464, "entropy": 1.2681864500045776, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:14.945594Z", "loop": 64, "env_steps": 39935999, "loss": 0.0421203188598156, "avg_return": 0.23156499862670898, "regret": 0.5660926103591919, "entropy": 1.25106942653656, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:16.149199Z", "loop": 65, "env_steps": 40550399, "loss": 0.04306836053729057, "avg_return": 0.24281245470046997, "regret": 0.5589349269866943, "entropy": 1.23192298412323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:17.353363Z", "loop": 66, "env_steps": 41164799, "loss": 0.04051661118865013, "avg_return": 0.24728216230869293, "regret": 0.552074670791626, "entropy": 1.2106833457946777, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:18.556520Z", "loop": 67, "env_steps": 41779199, "loss": 0.03972778469324112, "avg_return": 0.26001647114753723, "regret": 0.5456316471099854, "entropy": 1.187791109085083, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:19.759204Z", "loop": 68, "env_steps": 42393599, "loss": 0.03739207983016968, "avg_return": 0.26436591148376465, "regret": 0.5396623611450195, "entropy": 1.1634550094604492, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:20.968300Z", "loop": 69, "env_steps": 43007999, "loss": 0.03520260378718376, "avg_return": 0.2630080282688141, "regret": 0.5341866612434387, "entropy": 1.1378116607666016, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:22.171019Z", "loop": 70, "env_steps": 43622399, "loss": 0.03479066118597984, "avg_return": 0.27817991375923157, "regret": 0.5291553735733032, "entropy": 1.111043095588684, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:23.374017Z", "loop": 71, "env_steps": 44236799, "loss": 0.03201454132795334, "avg_return": 0.2809179127216339, "regret": 0.5246288776397705, "entropy": 1.0840649604797363, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:24.578499Z", "loop": 72, "env_steps": 44851199, "loss": 0.030794544145464897, "avg_return": 0.27894607186317444, "regret": 0.5205925107002258, "entropy": 1.0564998388290405, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:25.784153Z", "loop": 73, "env_steps": 45465599, "loss": 0.03061598353087902, "avg_return": 0.28147923946380615, "regret": 0.5169867277145386, "entropy": 1.0293796062469482, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:26.987191Z", "loop": 74, "env_steps": 46079999, "loss": 0.030116913840174675, "avg_return": 0.2906542718410492, "regret": 0.5137888789176941, "entropy": 1.0026706457138062, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:28.194186Z", "loop": 75, "env_steps": 46694399, "loss": 0.026453746482729912, "avg_return": 0.292578786611557, "regret": 0.5109825730323792, "entropy": 0.976474404335022, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:29.397946Z", "loop": 76, "env_steps": 47308799, "loss": 0.027383917942643166, "avg_return": 0.3001173138618469, "regret": 0.5085097551345825, "entropy": 0.9518378376960754, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:30.601947Z", "loop": 77, "env_steps": 47923199, "loss": 0.02354319952428341, "avg_return": 0.2880963385105133, "regret": 0.5063032507896423, "entropy": 0.9286284446716309, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:31.805055Z", "loop": 78, "env_steps": 48537599, "loss": 0.02454504370689392, "avg_return": 0.2981586158275604, "regret": 0.5043855905532837, "entropy": 0.9070124626159668, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:33.008915Z", "loop": 79, "env_steps": 49151999, "loss": 0.023354852572083473, "avg_return": 0.29987797141075134, "regret": 0.5026982426643372, "entropy": 0.8875803351402283, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:34.213905Z", "loop": 80, "env_steps": 49766399, "loss": 0.021791234612464905, "avg_return": 0.2985489070415497, "regret": 0.5012025833129883, "entropy": 0.869751513004303, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:35.452786Z", "loop": 81, "env_steps": 50380799, "loss": 0.021304668858647346, "avg_return": 0.29816752672195435, "regret": 0.4998868703842163, "entropy": 0.8528831005096436, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:36.659298Z", "loop": 82, "env_steps": 50995199, "loss": 0.020905014127492905, "avg_return": 0.30613183975219727, "regret": 0.4987410008907318, "entropy": 0.8376471996307373, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:37.862669Z", "loop": 83, "env_steps": 51609599, "loss": 0.019269948825240135, "avg_return": 0.3012502193450928, "regret": 0.49778398871421814, "entropy": 0.8237200975418091, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:39.068288Z", "loop": 84, "env_steps": 52223999, "loss": 0.020541787147521973, "avg_return": 0.3067135214805603, "regret": 0.4970187544822693, "entropy": 0.8112440705299377, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:40.276797Z", "loop": 85, "env_steps": 52838399, "loss": 0.019525637850165367, "avg_return": 0.30500268936157227, "regret": 0.4964349865913391, "entropy": 0.8002641201019287, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:41.479876Z", "loop": 86, "env_steps": 53452799, "loss": 0.018764836713671684, "avg_return": 0.31089159846305847, "regret": 0.49599689245224, "entropy": 0.7904478311538696, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:42.684158Z", "loop": 87, "env_steps": 54067199, "loss": 0.019111698493361473, "avg_return": 0.3107663691043854, "regret": 0.49569565057754517, "entropy": 0.781510055065155, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:43.886695Z", "loop": 88, "env_steps": 54681599, "loss": 0.019413752481341362, "avg_return": 0.3161516785621643, "regret": 0.4955465495586395, "entropy": 0.773065984249115, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:45.092323Z", "loop": 89, "env_steps": 55295999, "loss": 0.01823318749666214, "avg_return": 0.30642277002334595, "regret": 0.49540647864341736, "entropy": 0.7657985091209412, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:46.296765Z", "loop": 90, "env_steps": 55910399, "loss": 0.019764138385653496, "avg_return": 0.30773723125457764, "regret": 0.4952089488506317, "entropy": 0.7592382431030273, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:47.501234Z", "loop": 91, "env_steps": 56524799, "loss": 0.01824522577226162, "avg_return": 0.31033068895339966, "regret": 0.4949752688407898, "entropy": 0.7536996603012085, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:48.709350Z", "loop": 92, "env_steps": 57139199, "loss": 0.019681155681610107, "avg_return": 0.3120959997177124, "regret": 0.49469006061553955, "entropy": 0.74897301197052, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:49.918912Z", "loop": 93, "env_steps": 57753599, "loss": 0.018980706110596657, "avg_return": 0.30936163663864136, "regret": 0.4943869113922119, "entropy": 0.7449803948402405, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:51.124894Z", "loop": 94, "env_steps": 58367999, "loss": 0.016393262892961502, "avg_return": 0.30739253759384155, "regret": 0.4941021203994751, "entropy": 0.7415475845336914, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:52.330244Z", "loop": 95, "env_steps": 58982399, "loss": 0.01701163314282894, "avg_return": 0.3070433735847473, "regret": 0.4938914179801941, "entropy": 0.7383949756622314, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:53.534439Z", "loop": 96, "env_steps": 59596799, "loss": 0.01821742206811905, "avg_return": 0.30649012327194214, "regret": 0.4937458038330078, "entropy": 0.7357044219970703, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:54.737886Z", "loop": 97, "env_steps": 60211199, "loss": 0.01793178729712963, "avg_return": 0.31032827496528625, "regret": 0.49373236298561096, "entropy": 0.7327953577041626, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:55.942535Z", "loop": 98, "env_steps": 60825599, "loss": 0.017261719331145287, "avg_return": 0.30937403440475464, "regret": 0.49386537075042725, "entropy": 0.7297813892364502, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:57.146729Z", "loop": 99, "env_steps": 61439999, "loss": 0.017658431082963943, "avg_return": 0.3136953115463257, "regret": 0.4940629303455353, "entropy": 0.7265244126319885, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:58.350582Z", "loop": 100, "env_steps": 62054399, "loss": 0.016799626871943474, "avg_return": 0.312904417514801, "regret": 0.4942740201950073, "entropy": 0.7234395742416382, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:27:59.555484Z", "loop": 101, "env_steps": 62668799, "loss": 0.01808840036392212, "avg_return": 0.3135756552219391, "regret": 0.49431419372558594, "entropy": 0.7215321063995361, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:00.761468Z", "loop": 102, "env_steps": 63283199, "loss": 0.017861774191260338, "avg_return": 0.3127286434173584, "regret": 0.4941742420196533, "entropy": 0.7204887866973877, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:01.969668Z", "loop": 103, "env_steps": 63897599, "loss": 0.018012909218668938, "avg_return": 0.3083203434944153, "regret": 0.49395516514778137, "entropy": 0.7202035784721375, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:03.176508Z", "loop": 104, "env_steps": 64511999, "loss": 0.01694582961499691, "avg_return": 0.313003808259964, "regret": 0.49371856451034546, "entropy": 0.7200801968574524, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:04.377451Z", "loop": 105, "env_steps": 65126399, "loss": 0.017171576619148254, "avg_return": 0.3095787763595581, "regret": 0.493486225605011, "entropy": 0.7203542590141296, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:05.581798Z", "loop": 106, "env_steps": 65740799, "loss": 0.017158877104520798, "avg_return": 0.31342312693595886, "regret": 0.49330615997314453, "entropy": 0.720521092414856, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:06.785131Z", "loop": 107, "env_steps": 66355199, "loss": 0.019218966364860535, "avg_return": 0.3096945881843567, "regret": 0.49326005578041077, "entropy": 0.7203947901725769, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:07.996422Z", "loop": 108, "env_steps": 66969599, "loss": 0.01819661073386669, "avg_return": 0.30991876125335693, "regret": 0.4933302402496338, "entropy": 0.7198290824890137, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:09.202670Z", "loop": 109, "env_steps": 67583999, "loss": 0.016814855858683586, "avg_return": 0.3101175129413605, "regret": 0.4934418499469757, "entropy": 0.7191124558448792, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:10.404701Z", "loop": 110, "env_steps": 68198399, "loss": 0.017367364838719368, "avg_return": 0.3114738166332245, "regret": 0.4935818314552307, "entropy": 0.71834796667099, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:11.606239Z", "loop": 111, "env_steps": 68812799, "loss": 0.017330314964056015, "avg_return": 0.30178797245025635, "regret": 0.49370959401130676, "entropy": 0.7177040576934814, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:12.808391Z", "loop": 112, "env_steps": 69427199, "loss": 0.017040930688381195, "avg_return": 0.30939042568206787, "regret": 0.4938048720359802, "entropy": 0.7170820236206055, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:14.011675Z", "loop": 113, "env_steps": 70041599, "loss": 0.017498930916190147, "avg_return": 0.3108765482902527, "regret": 0.49394169449806213, "entropy": 0.7164073586463928, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:15.214542Z", "loop": 114, "env_steps": 70655999, "loss": 0.01827126368880272, "avg_return": 0.312713623046875, "regret": 0.4939528703689575, "entropy": 0.7161794304847717, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:16.417341Z", "loop": 115, "env_steps": 71270399, "loss": 0.017493033781647682, "avg_return": 0.3116387128829956, "regret": 0.49389928579330444, "entropy": 0.7158706784248352, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:17.618649Z", "loop": 116, "env_steps": 71884799, "loss": 0.017095820978283882, "avg_return": 0.30915847420692444, "regret": 0.4939020872116089, "entropy": 0.7152541279792786, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:18.822597Z", "loop": 117, "env_steps": 72499199, "loss": 0.017493490129709244, "avg_return": 0.3095298707485199, "regret": 0.49372363090515137, "entropy": 0.715282142162323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:20.025685Z", "loop": 118, "env_steps": 73113599, "loss": 0.017226317897439003, "avg_return": 0.31058651208877563, "regret": 0.4935775101184845, "entropy": 0.7152285575866699, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:21.229120Z", "loop": 119, "env_steps": 73727999, "loss": 0.01700408197939396, "avg_return": 0.30555397272109985, "regret": 0.4933762550354004, "entropy": 0.7153573036193848, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:22.430973Z", "loop": 120, "env_steps": 74342399, "loss": 0.017894789576530457, "avg_return": 0.30905812978744507, "regret": 0.4931929409503937, "entropy": 0.7154725790023804, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:23.634202Z", "loop": 121, "env_steps": 74956799, "loss": 0.01666046306490898, "avg_return": 0.3079482614994049, "regret": 0.49310678243637085, "entropy": 0.7152920365333557, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:24.835766Z", "loop": 122, "env_steps": 75571199, "loss": 0.0173889622092247, "avg_return": 0.30297791957855225, "regret": 0.4931788146495819, "entropy": 0.7146117091178894, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:26.037712Z", "loop": 123, "env_steps": 76185599, "loss": 0.018222572281956673, "avg_return": 0.314075767993927, "regret": 0.4933878183364868, "entropy": 0.7135285139083862, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:27.238705Z", "loop": 124, "env_steps": 76799999, "loss": 0.017664646729826927, "avg_return": 0.30942806601524353, "regret": 0.4936809241771698, "entropy": 0.7122165560722351, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:28.445074Z", "loop": 125, "env_steps": 77414399, "loss": 0.016920387744903564, "avg_return": 0.30533942580223083, "regret": 0.49401795864105225, "entropy": 0.7107943296432495, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:29.648981Z", "loop": 126, "env_steps": 78028799, "loss": 0.016721991822123528, "avg_return": 0.30445626378059387, "regret": 0.49409544467926025, "entropy": 0.7104772329330444, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:30.853474Z", "loop": 127, "env_steps": 78643199, "loss": 0.01750444434583187, "avg_return": 0.3134925365447998, "regret": 0.49407124519348145, "entropy": 0.7103829383850098, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:32.056716Z", "loop": 128, "env_steps": 79257599, "loss": 0.01600201241672039, "avg_return": 0.3105675280094147, "regret": 0.4939561188220978, "entropy": 0.7106395363807678, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:33.261784Z", "loop": 129, "env_steps": 79871999, "loss": 0.017357563599944115, "avg_return": 0.3115985095500946, "regret": 0.4936799705028534, "entropy": 0.7115654349327087, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:34.465237Z", "loop": 130, "env_steps": 80486399, "loss": 0.018202481791377068, "avg_return": 0.3134877681732178, "regret": 0.4934276342391968, "entropy": 0.7123409509658813, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:35.668178Z", "loop": 131, "env_steps": 81100799, "loss": 0.016444411128759384, "avg_return": 0.3138244152069092, "regret": 0.49319708347320557, "entropy": 0.7131186723709106, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:36.871311Z", "loop": 132, "env_steps": 81715199, "loss": 0.016537969931960106, "avg_return": 0.3123178482055664, "regret": 0.4930993914604187, "entropy": 0.7132996320724487, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:38.076270Z", "loop": 133, "env_steps": 82329599, "loss": 0.01672731712460518, "avg_return": 0.3085731565952301, "regret": 0.49305030703544617, "entropy": 0.7133161425590515, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:39.280418Z", "loop": 134, "env_steps": 82943999, "loss": 0.01633267104625702, "avg_return": 0.3091382384300232, "regret": 0.4930863380432129, "entropy": 0.7130338549613953, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:40.485781Z", "loop": 135, "env_steps": 83558399, "loss": 0.016351351514458656, "avg_return": 0.31824126839637756, "regret": 0.4931637942790985, "entropy": 0.7126367092132568, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:41.690704Z", "loop": 136, "env_steps": 84172799, "loss": 0.01732131652534008, "avg_return": 0.3080804646015167, "regret": 0.49330615997314453, "entropy": 0.7120823264122009, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:42.896527Z", "loop": 137, "env_steps": 84787199, "loss": 0.0167227890342474, "avg_return": 0.3076965808868408, "regret": 0.4934050440788269, "entropy": 0.711700975894928, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:44.102064Z", "loop": 138, "env_steps": 85401599, "loss": 0.01720859669148922, "avg_return": 0.3139127194881439, "regret": 0.4934946596622467, "entropy": 0.7113039493560791, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:45.307803Z", "loop": 139, "env_steps": 86015999, "loss": 0.01613946072757244, "avg_return": 0.3125135004520416, "regret": 0.49355560541152954, "entropy": 0.7109799981117249, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:46.512059Z", "loop": 140, "env_steps": 86630399, "loss": 0.016749447211623192, "avg_return": 0.31201329827308655, "regret": 0.4934625029563904, "entropy": 0.7112659811973572, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:47.716877Z", "loop": 141, "env_steps": 87244799, "loss": 0.01716524362564087, "avg_return": 0.3088345229625702, "regret": 0.49328354001045227, "entropy": 0.7117775082588196, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:48.922412Z", "loop": 142, "env_steps": 87859199, "loss": 0.018525969237089157, "avg_return": 0.3140917122364044, "regret": 0.49312323331832886, "entropy": 0.7121977210044861, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:50.129258Z", "loop": 143, "env_steps": 88473599, "loss": 0.017009621486067772, "avg_return": 0.3052535057067871, "regret": 0.49303480982780457, "entropy": 0.7123929858207703, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:51.336262Z", "loop": 144, "env_steps": 89087999, "loss": 0.016882842406630516, "avg_return": 0.31437069177627563, "regret": 0.49304795265197754, "entropy": 0.712224006652832, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:52.540401Z", "loop": 145, "env_steps": 89702399, "loss": 0.015740854665637016, "avg_return": 0.3120180368423462, "regret": 0.4931216239929199, "entropy": 0.7118457555770874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:53.753575Z", "loop": 146, "env_steps": 90316799, "loss": 0.017137175425887108, "avg_return": 0.3154595196247101, "regret": 0.493183434009552, "entropy": 0.7114993333816528, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:54.959877Z", "loop": 147, "env_steps": 90931199, "loss": 0.017398910596966743, "avg_return": 0.3086298704147339, "regret": 0.49323561787605286, "entropy": 0.7112463712692261, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:56.162985Z", "loop": 148, "env_steps": 91545599, "loss": 0.016450708732008934, "avg_return": 0.3127124607563019, "regret": 0.4932219386100769, "entropy": 0.7111546993255615, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:57.367774Z", "loop": 149, "env_steps": 92159999, "loss": 0.016083303838968277, "avg_return": 0.3145059645175934, "regret": 0.4931449890136719, "entropy": 0.711311399936676, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:58.575177Z", "loop": 150, "env_steps": 92774399, "loss": 0.017537027597427368, "avg_return": 0.3188283443450928, "regret": 0.49312257766723633, "entropy": 0.7111810445785522, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:28:59.780154Z", "loop": 151, "env_steps": 93388799, "loss": 0.01701260916888714, "avg_return": 0.31354162096977234, "regret": 0.49311694502830505, "entropy": 0.7109623551368713, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:00.983652Z", "loop": 152, "env_steps": 94003199, "loss": 0.015920063480734825, "avg_return": 0.3094465136528015, "regret": 0.4931029677391052, "entropy": 0.7109699845314026, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:02.196322Z", "loop": 153, "env_steps": 94617599, "loss": 0.017619488760828972, "avg_return": 0.307425856590271, "regret": 0.49308285117149353, "entropy": 0.7109020352363586, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:03.396965Z", "loop": 154, "env_steps": 95231999, "loss": 0.016138428822159767, "avg_return": 0.30190742015838623, "regret": 0.49304020404815674, "entropy": 0.7109590172767639, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:04.597869Z", "loop": 155, "env_steps": 95846399, "loss": 0.01664987951517105, "avg_return": 0.308857262134552, "regret": 0.49301397800445557, "entropy": 0.7110021114349365, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:05.797850Z", "loop": 156, "env_steps": 96460799, "loss": 0.01667764037847519, "avg_return": 0.30578431487083435, "regret": 0.4929899275302887, "entropy": 0.7109074592590332, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:06.998893Z", "loop": 157, "env_steps": 97075199, "loss": 0.015530404634773731, "avg_return": 0.3084154725074768, "regret": 0.4929787516593933, "entropy": 0.7107900381088257, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:08.200558Z", "loop": 158, "env_steps": 97689599, "loss": 0.016372065991163254, "avg_return": 0.3076711595058441, "regret": 0.49299174547195435, "entropy": 0.7105581164360046, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:09.400037Z", "loop": 159, "env_steps": 98303999, "loss": 0.017337974160909653, "avg_return": 0.3079046308994293, "regret": 0.4930219352245331, "entropy": 0.7101960182189941, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:10.599616Z", "loop": 160, "env_steps": 98918399, "loss": 0.016896042972803116, "avg_return": 0.3063569664955139, "regret": 0.49312517046928406, "entropy": 0.7096916437149048, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:11.801730Z", "loop": 161, "env_steps": 99532799, "loss": 0.01794848032295704, "avg_return": 0.31024348735809326, "regret": 0.49327516555786133, "entropy": 0.7089822888374329, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:13.004556Z", "loop": 162, "env_steps": 100147199, "loss": 0.018264584243297577, "avg_return": 0.31011733412742615, "regret": 0.4934920370578766, "entropy": 0.7080379724502563, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:14.211005Z", "loop": 163, "env_steps": 100761599, "loss": 0.0172381903976202, "avg_return": 0.30923914909362793, "regret": 0.49366724491119385, "entropy": 0.7072218656539917, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:15.415199Z", "loop": 164, "env_steps": 101375999, "loss": 0.017063995823264122, "avg_return": 0.3104473054409027, "regret": 0.49372398853302, "entropy": 0.7066841721534729, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:16.619511Z", "loop": 165, "env_steps": 101990399, "loss": 0.016392802819609642, "avg_return": 0.3117770552635193, "regret": 0.49368029832839966, "entropy": 0.7064669728279114, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:17.824733Z", "loop": 166, "env_steps": 102604799, "loss": 0.017838792875409126, "avg_return": 0.3170826733112335, "regret": 0.4933607578277588, "entropy": 0.7072015404701233, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:19.034186Z", "loop": 167, "env_steps": 103219199, "loss": 0.01762409321963787, "avg_return": 0.31052011251449585, "regret": 0.49313563108444214, "entropy": 0.7076947689056396, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:20.239530Z", "loop": 168, "env_steps": 103833599, "loss": 0.016596080735325813, "avg_return": 0.3140515089035034, "regret": 0.4929344058036804, "entropy": 0.7079691886901855, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:21.443891Z", "loop": 169, "env_steps": 104447999, "loss": 0.01731632463634014, "avg_return": 0.3105934262275696, "regret": 0.4929106831550598, "entropy": 0.7076781392097473, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:22.649634Z", "loop": 170, "env_steps": 105062399, "loss": 0.016060257330536842, "avg_return": 0.3103199899196625, "regret": 0.4930686056613922, "entropy": 0.7069272994995117, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:23.855078Z", "loop": 171, "env_steps": 105676799, "loss": 0.017878621816635132, "avg_return": 0.31445690989494324, "regret": 0.49327486753463745, "entropy": 0.7061225175857544, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:25.059294Z", "loop": 172, "env_steps": 106291199, "loss": 0.016257306560873985, "avg_return": 0.31631389260292053, "regret": 0.4934774339199066, "entropy": 0.7053757309913635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:26.263199Z", "loop": 173, "env_steps": 106905599, "loss": 0.01708477921783924, "avg_return": 0.3107137382030487, "regret": 0.49360349774360657, "entropy": 0.7048546075820923, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:27.467808Z", "loop": 174, "env_steps": 107519999, "loss": 0.016772886738181114, "avg_return": 0.3109484314918518, "regret": 0.49370333552360535, "entropy": 0.704279899597168, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:28.672067Z", "loop": 175, "env_steps": 108134399, "loss": 0.017115846276283264, "avg_return": 0.30997931957244873, "regret": 0.4937172532081604, "entropy": 0.7041161060333252, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:29.875974Z", "loop": 176, "env_steps": 108748799, "loss": 0.01709039695560932, "avg_return": 0.31598278880119324, "regret": 0.4936997592449188, "entropy": 0.7040472030639648, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:31.079613Z", "loop": 177, "env_steps": 109363199, "loss": 0.017656447365880013, "avg_return": 0.3097248077392578, "regret": 0.4935157299041748, "entropy": 0.7044825553894043, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:32.281449Z", "loop": 178, "env_steps": 109977599, "loss": 0.017750268802046776, "avg_return": 0.3008081018924713, "regret": 0.4933328330516815, "entropy": 0.7050231695175171, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:33.487344Z", "loop": 179, "env_steps": 110591999, "loss": 0.016785170882940292, "avg_return": 0.3113105893135071, "regret": 0.4931808412075043, "entropy": 0.7055598497390747, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:34.692863Z", "loop": 180, "env_steps": 111206399, "loss": 0.016068879514932632, "avg_return": 0.31364527344703674, "regret": 0.493038535118103, "entropy": 0.7060445547103882, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:35.897406Z", "loop": 181, "env_steps": 111820799, "loss": 0.017655149102211, "avg_return": 0.31565937399864197, "regret": 0.4929521083831787, "entropy": 0.7063069939613342, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:37.101596Z", "loop": 182, "env_steps": 112435199, "loss": 0.017016980797052383, "avg_return": 0.3018706440925598, "regret": 0.4928816854953766, "entropy": 0.7064894437789917, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:38.309093Z", "loop": 183, "env_steps": 113049599, "loss": 0.017186909914016724, "avg_return": 0.31666100025177, "regret": 0.49286630749702454, "entropy": 0.7064089179039001, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:39.512908Z", "loop": 184, "env_steps": 113663999, "loss": 0.016743162646889687, "avg_return": 0.31111419200897217, "regret": 0.4929324686527252, "entropy": 0.7060978412628174, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:40.718329Z", "loop": 185, "env_steps": 114278399, "loss": 0.017044853419065475, "avg_return": 0.3161506652832031, "regret": 0.4930868446826935, "entropy": 0.7054283618927002, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:41.922901Z", "loop": 186, "env_steps": 114892799, "loss": 0.016522424295544624, "avg_return": 0.31368961930274963, "regret": 0.4932660460472107, "entropy": 0.7046474814414978, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:43.127322Z", "loop": 187, "env_steps": 115507199, "loss": 0.017205726355314255, "avg_return": 0.3112691342830658, "regret": 0.4933374524116516, "entropy": 0.7042423486709595, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:44.331556Z", "loop": 188, "env_steps": 116121599, "loss": 0.01610752008855343, "avg_return": 0.3030131459236145, "regret": 0.4933159053325653, "entropy": 0.7041560411453247, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:45.536912Z", "loop": 189, "env_steps": 116735999, "loss": 0.01709417812526226, "avg_return": 0.3081485629081726, "regret": 0.4932255446910858, "entropy": 0.704321026802063, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:46.740874Z", "loop": 190, "env_steps": 117350399, "loss": 0.017324261367321014, "avg_return": 0.3126811683177948, "regret": 0.493113249540329, "entropy": 0.7046568989753723, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:47.945962Z", "loop": 191, "env_steps": 117964799, "loss": 0.015827931463718414, "avg_return": 0.31031155586242676, "regret": 0.49306124448776245, "entropy": 0.7047454118728638, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:49.149790Z", "loop": 192, "env_steps": 118579199, "loss": 0.016030510887503624, "avg_return": 0.30922263860702515, "regret": 0.49292001128196716, "entropy": 0.7050750851631165, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:50.362720Z", "loop": 193, "env_steps": 119193599, "loss": 0.01737028919160366, "avg_return": 0.3126196265220642, "regret": 0.49282950162887573, "entropy": 0.7051569819450378, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:51.566985Z", "loop": 194, "env_steps": 119807999, "loss": 0.017594968900084496, "avg_return": 0.3132794201374054, "regret": 0.4928867220878601, "entropy": 0.7047502398490906, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:52.772260Z", "loop": 195, "env_steps": 120422399, "loss": 0.018025584518909454, "avg_return": 0.3136318027973175, "regret": 0.4930928945541382, "entropy": 0.7038224935531616, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:53.975466Z", "loop": 196, "env_steps": 121036799, "loss": 0.0175874512642622, "avg_return": 0.31311458349227905, "regret": 0.4932434558868408, "entropy": 0.703156054019928, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:55.179459Z", "loop": 197, "env_steps": 121651199, "loss": 0.01664760708808899, "avg_return": 0.3142191469669342, "regret": 0.4932432174682617, "entropy": 0.7030254602432251, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:56.384978Z", "loop": 198, "env_steps": 122265599, "loss": 0.01639559678733349, "avg_return": 0.30713528394699097, "regret": 0.49317100644111633, "entropy": 0.7032769322395325, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:57.590658Z", "loop": 199, "env_steps": 122879999, "loss": 0.016576936468482018, "avg_return": 0.3009487986564636, "regret": 0.4930569529533386, "entropy": 0.7036612033843994, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:58.793726Z", "loop": 200, "env_steps": 123494399, "loss": 0.016672655940055847, "avg_return": 0.3073223829269409, "regret": 0.49294406175613403, "entropy": 0.7040823698043823, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:29:59.996631Z", "loop": 201, "env_steps": 124108799, "loss": 0.01779278926551342, "avg_return": 0.3072970509529114, "regret": 0.4928591847419739, "entropy": 0.7043743133544922, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:01.200249Z", "loop": 202, "env_steps": 124723199, "loss": 0.016844550147652626, "avg_return": 0.3148791790008545, "regret": 0.49281173944473267, "entropy": 0.7046093344688416, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:02.403782Z", "loop": 203, "env_steps": 125337599, "loss": 0.01586911454796791, "avg_return": 0.30770015716552734, "regret": 0.49282529950141907, "entropy": 0.7046534419059753, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:03.606320Z", "loop": 204, "env_steps": 125951999, "loss": 0.01736343465745449, "avg_return": 0.3177526891231537, "regret": 0.49285829067230225, "entropy": 0.7045257687568665, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:04.810295Z", "loop": 205, "env_steps": 126566399, "loss": 0.018953803926706314, "avg_return": 0.31070801615715027, "regret": 0.49289894104003906, "entropy": 0.704319953918457, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:06.014226Z", "loop": 206, "env_steps": 127180799, "loss": 0.015520353801548481, "avg_return": 0.3103034794330597, "regret": 0.492958128452301, "entropy": 0.7040324211120605, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:07.217930Z", "loop": 207, "env_steps": 127795199, "loss": 0.017317304387688637, "avg_return": 0.31286346912384033, "regret": 0.49304163455963135, "entropy": 0.7037216424942017, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:08.421311Z", "loop": 208, "env_steps": 128409599, "loss": 0.016508188098669052, "avg_return": 0.3117850124835968, "regret": 0.4930132329463959, "entropy": 0.7037335634231567, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:09.626374Z", "loop": 209, "env_steps": 129023999, "loss": 0.01773579604923725, "avg_return": 0.31362006068229675, "regret": 0.4929473102092743, "entropy": 0.703918993473053, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:10.828200Z", "loop": 210, "env_steps": 129638399, "loss": 0.017226114869117737, "avg_return": 0.3100922107696533, "regret": 0.4928964674472809, "entropy": 0.7040286064147949, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:12.029681Z", "loop": 211, "env_steps": 130252799, "loss": 0.01659531332552433, "avg_return": 0.31447163224220276, "regret": 0.4928513765335083, "entropy": 0.7041540145874023, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:13.237866Z", "loop": 212, "env_steps": 130867199, "loss": 0.017685111612081528, "avg_return": 0.317320317029953, "regret": 0.49280259013175964, "entropy": 0.7042707204818726, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:14.442886Z", "loop": 213, "env_steps": 131481599, "loss": 0.01767685078084469, "avg_return": 0.3104735314846039, "regret": 0.49280932545661926, "entropy": 0.7042058706283569, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:15.644539Z", "loop": 214, "env_steps": 132095999, "loss": 0.015809452161192894, "avg_return": 0.3114550709724426, "regret": 0.4928477108478546, "entropy": 0.7040035724639893, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:16.847343Z", "loop": 215, "env_steps": 132710399, "loss": 0.016652055084705353, "avg_return": 0.31615662574768066, "regret": 0.4928813874721527, "entropy": 0.7038909196853638, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:18.048576Z", "loop": 216, "env_steps": 133324799, "loss": 0.016204558312892914, "avg_return": 0.30768856406211853, "regret": 0.49290141463279724, "entropy": 0.7037862539291382, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:19.248714Z", "loop": 217, "env_steps": 133939199, "loss": 0.01709924265742302, "avg_return": 0.30643534660339355, "regret": 0.49298742413520813, "entropy": 0.7034909129142761, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:20.449584Z", "loop": 218, "env_steps": 134553599, "loss": 0.016319258138537407, "avg_return": 0.31323742866516113, "regret": 0.4929846525192261, "entropy": 0.703519344329834, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:21.651531Z", "loop": 219, "env_steps": 135167999, "loss": 0.016947677358984947, "avg_return": 0.31481367349624634, "regret": 0.49298274517059326, "entropy": 0.70357346534729, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:22.853848Z", "loop": 220, "env_steps": 135782399, "loss": 0.015574710443615913, "avg_return": 0.31210851669311523, "regret": 0.49293893575668335, "entropy": 0.7037078142166138, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:24.055142Z", "loop": 221, "env_steps": 136396799, "loss": 0.016430385410785675, "avg_return": 0.3121253550052643, "regret": 0.4928744435310364, "entropy": 0.7039797902107239, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:25.259911Z", "loop": 222, "env_steps": 137011199, "loss": 0.016803331673145294, "avg_return": 0.3082413375377655, "regret": 0.49284520745277405, "entropy": 0.704152524471283, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:26.461053Z", "loop": 223, "env_steps": 137625599, "loss": 0.015663204714655876, "avg_return": 0.31008750200271606, "regret": 0.4928325414657593, "entropy": 0.7042971849441528, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:27.664252Z", "loop": 224, "env_steps": 138239999, "loss": 0.017362719401717186, "avg_return": 0.31146979331970215, "regret": 0.49283477663993835, "entropy": 0.704334557056427, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:28.868940Z", "loop": 225, "env_steps": 138854399, "loss": 0.0152704743668437, "avg_return": 0.30320143699645996, "regret": 0.49283885955810547, "entropy": 0.7043480277061462, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:30.079314Z", "loop": 226, "env_steps": 139468799, "loss": 0.01807366870343685, "avg_return": 0.3186086118221283, "regret": 0.4928385615348816, "entropy": 0.7043298482894897, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:31.282091Z", "loop": 227, "env_steps": 140083199, "loss": 0.017236143350601196, "avg_return": 0.310263454914093, "regret": 0.4928235709667206, "entropy": 0.7043361663818359, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:32.486288Z", "loop": 228, "env_steps": 140697599, "loss": 0.016851285472512245, "avg_return": 0.3117119371891022, "regret": 0.49281057715415955, "entropy": 0.7043894529342651, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:33.692489Z", "loop": 229, "env_steps": 141311999, "loss": 0.01676223799586296, "avg_return": 0.3052944242954254, "regret": 0.4928053319454193, "entropy": 0.7044582962989807, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:34.896877Z", "loop": 230, "env_steps": 141926399, "loss": 0.016310425475239754, "avg_return": 0.3065745234489441, "regret": 0.49280187487602234, "entropy": 0.7044634819030762, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:36.102009Z", "loop": 231, "env_steps": 142540799, "loss": 0.016897717490792274, "avg_return": 0.3111893832683563, "regret": 0.49282127618789673, "entropy": 0.7044711112976074, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:37.307234Z", "loop": 232, "env_steps": 143155199, "loss": 0.01703042909502983, "avg_return": 0.31026893854141235, "regret": 0.4928344488143921, "entropy": 0.7044567465782166, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:38.512289Z", "loop": 233, "env_steps": 143769599, "loss": 0.01694631576538086, "avg_return": 0.3105829358100891, "regret": 0.4928445816040039, "entropy": 0.7045193314552307, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:39.717361Z", "loop": 234, "env_steps": 144383999, "loss": 0.017092248424887657, "avg_return": 0.3117789030075073, "regret": 0.49287599325180054, "entropy": 0.7044987082481384, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:40.923049Z", "loop": 235, "env_steps": 144998399, "loss": 0.01807555928826332, "avg_return": 0.315054327249527, "regret": 0.49290192127227783, "entropy": 0.7043448090553284, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:42.126509Z", "loop": 236, "env_steps": 145612799, "loss": 0.01760820858180523, "avg_return": 0.31801360845565796, "regret": 0.492929071187973, "entropy": 0.7041604518890381, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:43.329983Z", "loop": 237, "env_steps": 146227199, "loss": 0.016272395849227905, "avg_return": 0.3049839735031128, "regret": 0.49292922019958496, "entropy": 0.7039495706558228, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:44.540781Z", "loop": 238, "env_steps": 146841599, "loss": 0.016529925167560577, "avg_return": 0.30686286091804504, "regret": 0.4929485619068146, "entropy": 0.7036911249160767, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:45.748378Z", "loop": 239, "env_steps": 147455999, "loss": 0.01645919680595398, "avg_return": 0.30946484208106995, "regret": 0.49298012256622314, "entropy": 0.7034076452255249, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:46.953941Z", "loop": 240, "env_steps": 148070399, "loss": 0.01642797142267227, "avg_return": 0.3056511878967285, "regret": 0.49295705556869507, "entropy": 0.7033112645149231, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:48.160186Z", "loop": 241, "env_steps": 148684799, "loss": 0.0159669890999794, "avg_return": 0.307687908411026, "regret": 0.492905855178833, "entropy": 0.7032392024993896, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:49.366220Z", "loop": 242, "env_steps": 149299199, "loss": 0.01597871072590351, "avg_return": 0.30483052134513855, "regret": 0.49283960461616516, "entropy": 0.7032577991485596, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:50.568669Z", "loop": 243, "env_steps": 149913599, "loss": 0.01573486439883709, "avg_return": 0.30792585015296936, "regret": 0.49278029799461365, "entropy": 0.7032633423805237, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:51.773147Z", "loop": 244, "env_steps": 150527999, "loss": 0.01738623157143593, "avg_return": 0.3090653419494629, "regret": 0.49277839064598083, "entropy": 0.7030676007270813, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:52.986618Z", "loop": 245, "env_steps": 151142399, "loss": 0.0159161314368248, "avg_return": 0.3102927505970001, "regret": 0.49284979701042175, "entropy": 0.7025949358940125, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:54.200842Z", "loop": 246, "env_steps": 151756799, "loss": 0.017351431772112846, "avg_return": 0.3131580650806427, "regret": 0.49298691749572754, "entropy": 0.701953649520874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:55.413720Z", "loop": 247, "env_steps": 152371199, "loss": 0.017303021624684334, "avg_return": 0.30892229080200195, "regret": 0.493021696805954, "entropy": 0.7016770839691162, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:56.619365Z", "loop": 248, "env_steps": 152985599, "loss": 0.015824321657419205, "avg_return": 0.31153011322021484, "regret": 0.4929869472980499, "entropy": 0.7016884088516235, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:57.825663Z", "loop": 249, "env_steps": 153599999, "loss": 0.017039744183421135, "avg_return": 0.3109692335128784, "regret": 0.49297821521759033, "entropy": 0.7016317248344421, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:30:59.034591Z", "loop": 250, "env_steps": 154214399, "loss": 0.016042063012719154, "avg_return": 0.3142528235912323, "regret": 0.4929029047489166, "entropy": 0.7018283605575562, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:00.194898Z", "loop": 251, "env_steps": 154828799, "loss": 0.017153481021523476, "avg_return": 0.3101733922958374, "regret": 0.4929029047489166, "entropy": 0.7020363807678223, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:01.398197Z", "loop": 252, "env_steps": 155443199, "loss": 0.01701292395591736, "avg_return": 0.3131032884120941, "regret": 0.4927516579627991, "entropy": 0.7022193074226379, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:02.558202Z", "loop": 253, "env_steps": 156057599, "loss": 0.018017655238509178, "avg_return": 0.3147173523902893, "regret": 0.4927516579627991, "entropy": 0.7021082043647766, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:03.784660Z", "loop": 254, "env_steps": 156671999, "loss": 0.01704416424036026, "avg_return": 0.31672531366348267, "regret": 0.49280738830566406, "entropy": 0.7017739415168762, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:04.949964Z", "loop": 255, "env_steps": 157286399, "loss": 0.016587959602475166, "avg_return": 0.3131595849990845, "regret": 0.49280738830566406, "entropy": 0.7013118863105774, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:06.157908Z", "loop": 256, "env_steps": 157900799, "loss": 0.017040036618709564, "avg_return": 0.30826371908187866, "regret": 0.4930555522441864, "entropy": 0.7006559371948242, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:07.325273Z", "loop": 257, "env_steps": 158515199, "loss": 0.016082480549812317, "avg_return": 0.3149966299533844, "regret": 0.4930555522441864, "entropy": 0.7001913785934448, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:08.530494Z", "loop": 258, "env_steps": 159129599, "loss": 0.01645771414041519, "avg_return": 0.3051759898662567, "regret": 0.4930451512336731, "entropy": 0.7003406882286072, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:09.689625Z", "loop": 259, "env_steps": 159743999, "loss": 0.01592382974922657, "avg_return": 0.3070591688156128, "regret": 0.4930451512336731, "entropy": 0.7005044221878052, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:10.891889Z", "loop": 260, "env_steps": 160358399, "loss": 0.017196616157889366, "avg_return": 0.31009989976882935, "regret": 0.4928772747516632, "entropy": 0.7007157802581787, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:12.056116Z", "loop": 261, "env_steps": 160972799, "loss": 0.01650628075003624, "avg_return": 0.31013059616088867, "regret": 0.4928772747516632, "entropy": 0.7007243037223816, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:13.264146Z", "loop": 262, "env_steps": 161587199, "loss": 0.01749620959162712, "avg_return": 0.3111076056957245, "regret": 0.49277040362358093, "entropy": 0.7007896900177002, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:14.423734Z", "loop": 263, "env_steps": 162201599, "loss": 0.01678384654223919, "avg_return": 0.3103034496307373, "regret": 0.49277040362358093, "entropy": 0.7007498741149902, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:15.625649Z", "loop": 264, "env_steps": 162815999, "loss": 0.0164840929210186, "avg_return": 0.3081698715686798, "regret": 0.4927017390727997, "entropy": 0.7006300091743469, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:16.788419Z", "loop": 265, "env_steps": 163430399, "loss": 0.016431553289294243, "avg_return": 0.31326809525489807, "regret": 0.4927017390727997, "entropy": 0.7004895210266113, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:18.000584Z", "loop": 266, "env_steps": 164044799, "loss": 0.015677304938435555, "avg_return": 0.3051186800003052, "regret": 0.49270713329315186, "entropy": 0.7004112005233765, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:19.159969Z", "loop": 267, "env_steps": 164659199, "loss": 0.016544781625270844, "avg_return": 0.30879706144332886, "regret": 0.49270713329315186, "entropy": 0.7003039121627808, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:20.364643Z", "loop": 268, "env_steps": 165273599, "loss": 0.017491037026047707, "avg_return": 0.3112756013870239, "regret": 0.49269425868988037, "entropy": 0.7002220153808594, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:21.523281Z", "loop": 269, "env_steps": 165887999, "loss": 0.016258439049124718, "avg_return": 0.3135356307029724, "regret": 0.49269425868988037, "entropy": 0.7001041173934937, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:22.724436Z", "loop": 270, "env_steps": 166502399, "loss": 0.016960851848125458, "avg_return": 0.31281259655952454, "regret": 0.4926910996437073, "entropy": 0.6999672055244446, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:23.884289Z", "loop": 271, "env_steps": 167116799, "loss": 0.017272362485527992, "avg_return": 0.3133603632450104, "regret": 0.4926910996437073, "entropy": 0.6998372673988342, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:25.086713Z", "loop": 272, "env_steps": 167731199, "loss": 0.018023056909441948, "avg_return": 0.3138270676136017, "regret": 0.49269920587539673, "entropy": 0.6996610164642334, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:26.245826Z", "loop": 273, "env_steps": 168345599, "loss": 0.016968563199043274, "avg_return": 0.31236982345581055, "regret": 0.49269920587539673, "entropy": 0.6993549466133118, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:27.456640Z", "loop": 274, "env_steps": 168959999, "loss": 0.0171893872320652, "avg_return": 0.31054964661598206, "regret": 0.4927738606929779, "entropy": 0.6992321014404297, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:28.616527Z", "loop": 275, "env_steps": 169574399, "loss": 0.015383407473564148, "avg_return": 0.30318447947502136, "regret": 0.4927738606929779, "entropy": 0.6989989280700684, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:29.837547Z", "loop": 276, "env_steps": 170188799, "loss": 0.01633233204483986, "avg_return": 0.3135007917881012, "regret": 0.4928974211215973, "entropy": 0.698700487613678, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:30.996658Z", "loop": 277, "env_steps": 170803199, "loss": 0.01649201288819313, "avg_return": 0.30526337027549744, "regret": 0.4928974211215973, "entropy": 0.6986768245697021, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:32.199258Z", "loop": 278, "env_steps": 171417599, "loss": 0.017243972048163414, "avg_return": 0.31256359815597534, "regret": 0.4928836524486542, "entropy": 0.6987030506134033, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:33.359048Z", "loop": 279, "env_steps": 172031999, "loss": 0.017342664301395416, "avg_return": 0.31272175908088684, "regret": 0.4928836524486542, "entropy": 0.6989496946334839, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:34.565075Z", "loop": 280, "env_steps": 172646399, "loss": 0.016654713079333305, "avg_return": 0.3108184039592743, "regret": 0.49272409081459045, "entropy": 0.6992294788360596, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:35.724808Z", "loop": 281, "env_steps": 173260799, "loss": 0.016612617298960686, "avg_return": 0.3077715039253235, "regret": 0.49272409081459045, "entropy": 0.6994348168373108, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:36.934280Z", "loop": 282, "env_steps": 173875199, "loss": 0.016622770577669144, "avg_return": 0.3128705620765686, "regret": 0.4927063584327698, "entropy": 0.6993678212165833, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:38.094462Z", "loop": 283, "env_steps": 174489599, "loss": 0.016131412237882614, "avg_return": 0.30550438165664673, "regret": 0.4927063584327698, "entropy": 0.6991231441497803, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:39.298047Z", "loop": 284, "env_steps": 175103999, "loss": 0.016282744705677032, "avg_return": 0.30526378750801086, "regret": 0.4929552674293518, "entropy": 0.698630154132843, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:40.457977Z", "loop": 285, "env_steps": 175718399, "loss": 0.016800791025161743, "avg_return": 0.3123561143875122, "regret": 0.4929552674293518, "entropy": 0.6978951096534729, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:41.662613Z", "loop": 286, "env_steps": 176332799, "loss": 0.015432434156537056, "avg_return": 0.3133203089237213, "regret": 0.49335235357284546, "entropy": 0.6973963379859924, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:42.821995Z", "loop": 287, "env_steps": 176947199, "loss": 0.017229897901415825, "avg_return": 0.3084478974342346, "regret": 0.49335235357284546, "entropy": 0.6976672410964966, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:44.026134Z", "loop": 288, "env_steps": 177561599, "loss": 0.0169879999011755, "avg_return": 0.31458213925361633, "regret": 0.4930715262889862, "entropy": 0.6983570456504822, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:45.186151Z", "loop": 289, "env_steps": 178175999, "loss": 0.01799248717725277, "avg_return": 0.3138207793235779, "regret": 0.4930715262889862, "entropy": 0.6989949941635132, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:46.388020Z", "loop": 290, "env_steps": 178790399, "loss": 0.017532164230942726, "avg_return": 0.3077736496925354, "regret": 0.4926905930042267, "entropy": 0.6996084451675415, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:47.546208Z", "loop": 291, "env_steps": 179404799, "loss": 0.018322890624403954, "avg_return": 0.3182426989078522, "regret": 0.4926905930042267, "entropy": 0.6994994282722473, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:48.748024Z", "loop": 292, "env_steps": 180019199, "loss": 0.017533011734485626, "avg_return": 0.3102397322654724, "regret": 0.4928527772426605, "entropy": 0.6989312171936035, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:49.907886Z", "loop": 293, "env_steps": 180633599, "loss": 0.016160747036337852, "avg_return": 0.3140883445739746, "regret": 0.4928527772426605, "entropy": 0.6981921195983887, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:51.111042Z", "loop": 294, "env_steps": 181247999, "loss": 0.016749843955039978, "avg_return": 0.308432012796402, "regret": 0.4932999014854431, "entropy": 0.6973415613174438, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:52.269762Z", "loop": 295, "env_steps": 181862399, "loss": 0.01726566068828106, "avg_return": 0.3122888207435608, "regret": 0.4932999014854431, "entropy": 0.696377158164978, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:53.472158Z", "loop": 296, "env_steps": 182476799, "loss": 0.017042694613337517, "avg_return": 0.30801457166671753, "regret": 0.4935760200023651, "entropy": 0.6964012384414673, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:54.630163Z", "loop": 297, "env_steps": 183091199, "loss": 0.01632496528327465, "avg_return": 0.3040715754032135, "regret": 0.4935760200023651, "entropy": 0.696967363357544, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:55.833158Z", "loop": 298, "env_steps": 183705599, "loss": 0.01589909754693508, "avg_return": 0.30781131982803345, "regret": 0.4931797981262207, "entropy": 0.6978851556777954, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:56.997764Z", "loop": 299, "env_steps": 184319999, "loss": 0.01693417690694332, "avg_return": 0.31828629970550537, "regret": 0.4931797981262207, "entropy": 0.69837486743927, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:58.206114Z", "loop": 300, "env_steps": 184934399, "loss": 0.016280733048915863, "avg_return": 0.30921754240989685, "regret": 0.49289608001708984, "entropy": 0.6988879442214966, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:31:59.366580Z", "loop": 301, "env_steps": 185548799, "loss": 0.0160520076751709, "avg_return": 0.30455338954925537, "regret": 0.49289608001708984, "entropy": 0.6994931697845459, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:00.571575Z", "loop": 302, "env_steps": 186163199, "loss": 0.01642341911792755, "avg_return": 0.3013341724872589, "regret": 0.4926796555519104, "entropy": 0.6997859477996826, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:01.729994Z", "loop": 303, "env_steps": 186777599, "loss": 0.015759680420160294, "avg_return": 0.30909547209739685, "regret": 0.4926796555519104, "entropy": 0.6997933983802795, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:02.940502Z", "loop": 304, "env_steps": 187391999, "loss": 0.016672994941473007, "avg_return": 0.30892691016197205, "regret": 0.49278947710990906, "entropy": 0.699520468711853, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:04.099819Z", "loop": 305, "env_steps": 188006399, "loss": 0.01603337749838829, "avg_return": 0.30645549297332764, "regret": 0.49278947710990906, "entropy": 0.6992334723472595, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:05.304616Z", "loop": 306, "env_steps": 188620799, "loss": 0.017153970897197723, "avg_return": 0.3123440146446228, "regret": 0.4930381774902344, "entropy": 0.6988174915313721, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:06.463944Z", "loop": 307, "env_steps": 189235199, "loss": 0.01639510691165924, "avg_return": 0.31028974056243896, "regret": 0.4930381774902344, "entropy": 0.6985864639282227, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:07.668005Z", "loop": 308, "env_steps": 189849599, "loss": 0.01674068532884121, "avg_return": 0.3059377670288086, "regret": 0.4931808412075043, "entropy": 0.6983150243759155, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:08.827139Z", "loop": 309, "env_steps": 190463999, "loss": 0.016500256955623627, "avg_return": 0.3128979504108429, "regret": 0.4931808412075043, "entropy": 0.6975871920585632, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:10.029298Z", "loop": 310, "env_steps": 191078399, "loss": 0.01809420995414257, "avg_return": 0.3129512071609497, "regret": 0.4934794008731842, "entropy": 0.6972376704216003, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:11.190053Z", "loop": 311, "env_steps": 191692799, "loss": 0.01643914356827736, "avg_return": 0.3094683289527893, "regret": 0.4934794008731842, "entropy": 0.6973019242286682, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:12.394267Z", "loop": 312, "env_steps": 192307199, "loss": 0.016699058935046196, "avg_return": 0.31706249713897705, "regret": 0.49333566427230835, "entropy": 0.6975889205932617, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:13.554121Z", "loop": 313, "env_steps": 192921599, "loss": 0.016680916771292686, "avg_return": 0.309171199798584, "regret": 0.49333566427230835, "entropy": 0.6985297203063965, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:14.757910Z", "loop": 314, "env_steps": 193535999, "loss": 0.017371727153658867, "avg_return": 0.3071453273296356, "regret": 0.4928155541419983, "entropy": 0.6990306377410889, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:15.923912Z", "loop": 315, "env_steps": 194150399, "loss": 0.016460087150335312, "avg_return": 0.305347740650177, "regret": 0.4928155541419983, "entropy": 0.6992761492729187, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:17.127706Z", "loop": 316, "env_steps": 194764799, "loss": 0.016736192628741264, "avg_return": 0.30836132168769836, "regret": 0.4926700294017792, "entropy": 0.6991435289382935, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:18.287361Z", "loop": 317, "env_steps": 195379199, "loss": 0.0157629381865263, "avg_return": 0.31270402669906616, "regret": 0.4926700294017792, "entropy": 0.6984701156616211, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:19.493758Z", "loop": 318, "env_steps": 195993599, "loss": 0.016563963145017624, "avg_return": 0.3046528995037079, "regret": 0.49296584725379944, "entropy": 0.6977705955505371, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:20.656553Z", "loop": 319, "env_steps": 196607999, "loss": 0.015917662531137466, "avg_return": 0.3084213435649872, "regret": 0.49296584725379944, "entropy": 0.6967100501060486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:21.866241Z", "loop": 320, "env_steps": 197222399, "loss": 0.017126120626926422, "avg_return": 0.3078668713569641, "regret": 0.4932805895805359, "entropy": 0.6965446472167969, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:23.025947Z", "loop": 321, "env_steps": 197836799, "loss": 0.017214056104421616, "avg_return": 0.31201472878456116, "regret": 0.4932805895805359, "entropy": 0.6971296072006226, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:24.227275Z", "loop": 322, "env_steps": 198451199, "loss": 0.01646602712571621, "avg_return": 0.3106352686882019, "regret": 0.492838591337204, "entropy": 0.6980766654014587, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:25.388293Z", "loop": 323, "env_steps": 199065599, "loss": 0.0160924531519413, "avg_return": 0.30051320791244507, "regret": 0.492838591337204, "entropy": 0.6987059712409973, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:26.599672Z", "loop": 324, "env_steps": 199679999, "loss": 0.017535587772727013, "avg_return": 0.3122901916503906, "regret": 0.4926583468914032, "entropy": 0.6988435387611389, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:27.759966Z", "loop": 325, "env_steps": 200294399, "loss": 0.01670982874929905, "avg_return": 0.3104144334793091, "regret": 0.4926583468914032, "entropy": 0.6985654830932617, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:28.963720Z", "loop": 326, "env_steps": 200908799, "loss": 0.016069909557700157, "avg_return": 0.3069497346878052, "regret": 0.49285343289375305, "entropy": 0.6982465386390686, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:30.123663Z", "loop": 327, "env_steps": 201523199, "loss": 0.016565224155783653, "avg_return": 0.31113964319229126, "regret": 0.49285343289375305, "entropy": 0.6980710625648499, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:31.333470Z", "loop": 328, "env_steps": 202137599, "loss": 0.01701582781970501, "avg_return": 0.3174324631690979, "regret": 0.4929223358631134, "entropy": 0.6980171799659729, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:32.496703Z", "loop": 329, "env_steps": 202751999, "loss": 0.015434137545526028, "avg_return": 0.31254345178604126, "regret": 0.4929223358631134, "entropy": 0.6979250907897949, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:33.710692Z", "loop": 330, "env_steps": 203366399, "loss": 0.017276285216212273, "avg_return": 0.3178202211856842, "regret": 0.4928774833679199, "entropy": 0.6981230974197388, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:34.873529Z", "loop": 331, "env_steps": 203980799, "loss": 0.017023079097270966, "avg_return": 0.3086860179901123, "regret": 0.4928774833679199, "entropy": 0.6983580589294434, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:36.079734Z", "loop": 332, "env_steps": 204595199, "loss": 0.01647188514471054, "avg_return": 0.31111955642700195, "regret": 0.4926958680152893, "entropy": 0.698641300201416, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:37.237881Z", "loop": 333, "env_steps": 205209599, "loss": 0.017374727874994278, "avg_return": 0.3108121454715729, "regret": 0.4926958680152893, "entropy": 0.6987584829330444, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:38.438327Z", "loop": 334, "env_steps": 205823999, "loss": 0.016872979700565338, "avg_return": 0.3089364767074585, "regret": 0.49267154932022095, "entropy": 0.6985971927642822, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:39.598380Z", "loop": 335, "env_steps": 206438399, "loss": 0.016185076907277107, "avg_return": 0.30813929438591003, "regret": 0.49267154932022095, "entropy": 0.6981154680252075, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:40.804419Z", "loop": 336, "env_steps": 207052799, "loss": 0.01744386926293373, "avg_return": 0.3120706379413605, "regret": 0.4929090142250061, "entropy": 0.6976979970932007, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:41.967307Z", "loop": 337, "env_steps": 207667199, "loss": 0.01740153692662716, "avg_return": 0.3229641020298004, "regret": 0.4929090142250061, "entropy": 0.6972835659980774, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:43.169928Z", "loop": 338, "env_steps": 208281599, "loss": 0.01791517250239849, "avg_return": 0.31858041882514954, "regret": 0.49305543303489685, "entropy": 0.6972479820251465, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:44.328519Z", "loop": 339, "env_steps": 208895999, "loss": 0.016332639381289482, "avg_return": 0.3105461597442627, "regret": 0.49305543303489685, "entropy": 0.6978116631507874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:45.530684Z", "loop": 340, "env_steps": 209510399, "loss": 0.01628715544939041, "avg_return": 0.30812868475914, "regret": 0.492773175239563, "entropy": 0.698349118232727, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:46.690487Z", "loop": 341, "env_steps": 210124799, "loss": 0.016652105376124382, "avg_return": 0.31033340096473694, "regret": 0.492773175239563, "entropy": 0.6988012790679932, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:47.896415Z", "loop": 342, "env_steps": 210739199, "loss": 0.017055897042155266, "avg_return": 0.3163115382194519, "regret": 0.4926488995552063, "entropy": 0.6989766955375671, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:49.058233Z", "loop": 343, "env_steps": 211353599, "loss": 0.015371625311672688, "avg_return": 0.3062412142753601, "regret": 0.4926488995552063, "entropy": 0.6988665461540222, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:50.263272Z", "loop": 344, "env_steps": 211967999, "loss": 0.016655119135975838, "avg_return": 0.3001866042613983, "regret": 0.4927268326282501, "entropy": 0.6987836360931396, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:51.423611Z", "loop": 345, "env_steps": 212582399, "loss": 0.017452191561460495, "avg_return": 0.31334787607192993, "regret": 0.4927268326282501, "entropy": 0.6987166404724121, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:52.626070Z", "loop": 346, "env_steps": 213196799, "loss": 0.015850305557250977, "avg_return": 0.30849573016166687, "regret": 0.49276676774024963, "entropy": 0.6986733078956604, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:53.789114Z", "loop": 347, "env_steps": 213811199, "loss": 0.015587860718369484, "avg_return": 0.307422935962677, "regret": 0.49276676774024963, "entropy": 0.6986644864082336, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:54.991289Z", "loop": 348, "env_steps": 214425599, "loss": 0.015693331137299538, "avg_return": 0.30790209770202637, "regret": 0.4927140474319458, "entropy": 0.6987388134002686, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:56.149692Z", "loop": 349, "env_steps": 215039999, "loss": 0.016318971291184425, "avg_return": 0.3117465674877167, "regret": 0.4927140474319458, "entropy": 0.6987719535827637, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:57.352101Z", "loop": 350, "env_steps": 215654399, "loss": 0.01585976593196392, "avg_return": 0.30306050181388855, "regret": 0.49264851212501526, "entropy": 0.6987496018409729, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:58.511379Z", "loop": 351, "env_steps": 216268799, "loss": 0.016254276037216187, "avg_return": 0.313513845205307, "regret": 0.49264851212501526, "entropy": 0.69870924949646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:32:59.715358Z", "loop": 352, "env_steps": 216883199, "loss": 0.01579456403851509, "avg_return": 0.30671554803848267, "regret": 0.49263209104537964, "entropy": 0.6986146569252014, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:00.878855Z", "loop": 353, "env_steps": 217497599, "loss": 0.016576072201132774, "avg_return": 0.31450313329696655, "regret": 0.49263209104537964, "entropy": 0.6984468102455139, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:02.092769Z", "loop": 354, "env_steps": 218111999, "loss": 0.016727525740861893, "avg_return": 0.3105846345424652, "regret": 0.4927119314670563, "entropy": 0.6981670260429382, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:03.260046Z", "loop": 355, "env_steps": 218726399, "loss": 0.016208013519644737, "avg_return": 0.30631569027900696, "regret": 0.4927119314670563, "entropy": 0.6978958249092102, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:04.466718Z", "loop": 356, "env_steps": 219340799, "loss": 0.01648029498755932, "avg_return": 0.3095068037509918, "regret": 0.49282175302505493, "entropy": 0.6976955533027649, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:05.629758Z", "loop": 357, "env_steps": 219955199, "loss": 0.01671028882265091, "avg_return": 0.3137345314025879, "regret": 0.49282175302505493, "entropy": 0.6973855495452881, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:06.838402Z", "loop": 358, "env_steps": 220569599, "loss": 0.016403643414378166, "avg_return": 0.3088187277317047, "regret": 0.49280664324760437, "entropy": 0.6976166367530823, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:07.998941Z", "loop": 359, "env_steps": 221183999, "loss": 0.016703756526112556, "avg_return": 0.3072187304496765, "regret": 0.49280664324760437, "entropy": 0.6976896524429321, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:09.199310Z", "loop": 360, "env_steps": 221798399, "loss": 0.016934024170041084, "avg_return": 0.31145229935646057, "regret": 0.49272361397743225, "entropy": 0.6978688836097717, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:10.357265Z", "loop": 361, "env_steps": 222412799, "loss": 0.018150795251131058, "avg_return": 0.311989426612854, "regret": 0.49272361397743225, "entropy": 0.6981199979782104, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:11.558590Z", "loop": 362, "env_steps": 223027199, "loss": 0.017253518104553223, "avg_return": 0.3117537498474121, "regret": 0.4926183521747589, "entropy": 0.6982825994491577, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:12.721671Z", "loop": 363, "env_steps": 223641599, "loss": 0.01580747775733471, "avg_return": 0.30580443143844604, "regret": 0.4926183521747589, "entropy": 0.6982521414756775, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:13.932805Z", "loop": 364, "env_steps": 224255999, "loss": 0.017120521515607834, "avg_return": 0.31389856338500977, "regret": 0.4926442503929138, "entropy": 0.6982623934745789, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:15.094788Z", "loop": 365, "env_steps": 224870399, "loss": 0.01740691252052784, "avg_return": 0.31517744064331055, "regret": 0.4926442503929138, "entropy": 0.6982617378234863, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:16.306545Z", "loop": 366, "env_steps": 225484799, "loss": 0.017225926741957664, "avg_return": 0.3151932656764984, "regret": 0.492632657289505, "entropy": 0.6982866525650024, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:17.469057Z", "loop": 367, "env_steps": 226099199, "loss": 0.016657225787639618, "avg_return": 0.3098697066307068, "regret": 0.492632657289505, "entropy": 0.6982949376106262, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:18.674164Z", "loop": 368, "env_steps": 226713599, "loss": 0.0169602632522583, "avg_return": 0.3168911337852478, "regret": 0.49261587858200073, "entropy": 0.6982901096343994, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:19.838047Z", "loop": 369, "env_steps": 227327999, "loss": 0.015975577756762505, "avg_return": 0.30916887521743774, "regret": 0.49261587858200073, "entropy": 0.6982235908508301, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:21.042105Z", "loop": 370, "env_steps": 227942399, "loss": 0.01666237600147724, "avg_return": 0.31078416109085083, "regret": 0.49264249205589294, "entropy": 0.6981785297393799, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:22.201872Z", "loop": 371, "env_steps": 228556799, "loss": 0.017253631725907326, "avg_return": 0.31369879841804504, "regret": 0.49264249205589294, "entropy": 0.6981409788131714, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:23.407005Z", "loop": 372, "env_steps": 229171199, "loss": 0.016064457595348358, "avg_return": 0.311151385307312, "regret": 0.4926609396934509, "entropy": 0.698093831539154, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:24.568498Z", "loop": 373, "env_steps": 229785599, "loss": 0.01701505295932293, "avg_return": 0.30877941846847534, "regret": 0.4926609396934509, "entropy": 0.6981573104858398, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:25.778341Z", "loop": 374, "env_steps": 230399999, "loss": 0.017187131568789482, "avg_return": 0.31172439455986023, "regret": 0.4926268458366394, "entropy": 0.6981750726699829, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:26.938143Z", "loop": 375, "env_steps": 231014399, "loss": 0.017577091231942177, "avg_return": 0.3171466588973999, "regret": 0.4926268458366394, "entropy": 0.6981711387634277, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:28.143231Z", "loop": 376, "env_steps": 231628799, "loss": 0.016580617055296898, "avg_return": 0.3102792501449585, "regret": 0.49262911081314087, "entropy": 0.6982137560844421, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:29.302888Z", "loop": 377, "env_steps": 232243199, "loss": 0.017468135803937912, "avg_return": 0.3086010217666626, "regret": 0.49262911081314087, "entropy": 0.6983076930046082, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:30.506089Z", "loop": 378, "env_steps": 232857599, "loss": 0.01663258485496044, "avg_return": 0.30778738856315613, "regret": 0.4926135241985321, "entropy": 0.6983405351638794, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:31.666774Z", "loop": 379, "env_steps": 233471999, "loss": 0.016198309138417244, "avg_return": 0.3112998902797699, "regret": 0.4926135241985321, "entropy": 0.6983417868614197, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:32.873616Z", "loop": 380, "env_steps": 234086399, "loss": 0.016423895955085754, "avg_return": 0.31194889545440674, "regret": 0.4926320016384125, "entropy": 0.6983201503753662, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:34.035362Z", "loop": 381, "env_steps": 234700799, "loss": 0.01699627749621868, "avg_return": 0.3120344281196594, "regret": 0.4926320016384125, "entropy": 0.6982828974723816, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:35.245229Z", "loop": 382, "env_steps": 235315199, "loss": 0.01671167090535164, "avg_return": 0.3114722967147827, "regret": 0.4926655888557434, "entropy": 0.6983026266098022, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:36.406985Z", "loop": 383, "env_steps": 235929599, "loss": 0.015475465916097164, "avg_return": 0.31047555804252625, "regret": 0.4926655888557434, "entropy": 0.698249340057373, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:37.620006Z", "loop": 384, "env_steps": 236543999, "loss": 0.017632517963647842, "avg_return": 0.30973753333091736, "regret": 0.4927360713481903, "entropy": 0.6981256008148193, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:38.783690Z", "loop": 385, "env_steps": 237158399, "loss": 0.018141508102416992, "avg_return": 0.31660208106040955, "regret": 0.4927360713481903, "entropy": 0.6978383660316467, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:39.987645Z", "loop": 386, "env_steps": 237772799, "loss": 0.016772253438830376, "avg_return": 0.30533143877983093, "regret": 0.4928225576877594, "entropy": 0.6979163289070129, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:41.146939Z", "loop": 387, "env_steps": 238387199, "loss": 0.015938568860292435, "avg_return": 0.30871859192848206, "regret": 0.4928225576877594, "entropy": 0.6980196833610535, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:42.350417Z", "loop": 388, "env_steps": 239001599, "loss": 0.016211966052651405, "avg_return": 0.3064146637916565, "regret": 0.4927254319190979, "entropy": 0.6982445120811462, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:43.514784Z", "loop": 389, "env_steps": 239615999, "loss": 0.016017107293009758, "avg_return": 0.3135172724723816, "regret": 0.4927254319190979, "entropy": 0.6983290910720825, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:44.721760Z", "loop": 390, "env_steps": 240230399, "loss": 0.01655084453523159, "avg_return": 0.30747997760772705, "regret": 0.4926537275314331, "entropy": 0.6984577775001526, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:45.881027Z", "loop": 391, "env_steps": 240844799, "loss": 0.0168620478361845, "avg_return": 0.31136205792427063, "regret": 0.4926537275314331, "entropy": 0.698593258857727, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:47.080833Z", "loop": 392, "env_steps": 241459199, "loss": 0.017915287986397743, "avg_return": 0.31820160150527954, "regret": 0.49261340498924255, "entropy": 0.6986310482025146, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:48.239915Z", "loop": 393, "env_steps": 242073599, "loss": 0.017112476751208305, "avg_return": 0.31544873118400574, "regret": 0.49261340498924255, "entropy": 0.6986252665519714, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:49.446808Z", "loop": 394, "env_steps": 242687999, "loss": 0.01677808165550232, "avg_return": 0.3146663308143616, "regret": 0.4926677644252777, "entropy": 0.6984704732894897, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:50.610429Z", "loop": 395, "env_steps": 243302399, "loss": 0.01728406734764576, "avg_return": 0.3128182888031006, "regret": 0.4926677644252777, "entropy": 0.6982350945472717, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:51.813108Z", "loop": 396, "env_steps": 243916799, "loss": 0.01511857844889164, "avg_return": 0.3089640736579895, "regret": 0.4928118586540222, "entropy": 0.6978601217269897, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:52.972214Z", "loop": 397, "env_steps": 244531199, "loss": 0.017108049243688583, "avg_return": 0.3127555847167969, "regret": 0.4928118586540222, "entropy": 0.6977531909942627, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:54.173074Z", "loop": 398, "env_steps": 245145599, "loss": 0.01679481938481331, "avg_return": 0.3134595453739166, "regret": 0.4928346574306488, "entropy": 0.6978057026863098, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:55.332641Z", "loop": 399, "env_steps": 245759999, "loss": 0.015696225687861443, "avg_return": 0.3076026141643524, "regret": 0.4928346574306488, "entropy": 0.6978252530097961, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:56.532319Z", "loop": 400, "env_steps": 246374399, "loss": 0.017059696838259697, "avg_return": 0.31200098991394043, "regret": 0.49277448654174805, "entropy": 0.6979652047157288, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:57.693835Z", "loop": 401, "env_steps": 246988799, "loss": 0.01701560616493225, "avg_return": 0.3104493319988251, "regret": 0.49277448654174805, "entropy": 0.6979859471321106, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:33:58.901836Z", "loop": 402, "env_steps": 247603199, "loss": 0.01656602881848812, "avg_return": 0.30608710646629333, "regret": 0.4927248954772949, "entropy": 0.6979900598526001, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:00.060513Z", "loop": 403, "env_steps": 248217599, "loss": 0.01729387231171131, "avg_return": 0.31542617082595825, "regret": 0.4927248954772949, "entropy": 0.6980588436126709, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:01.264608Z", "loop": 404, "env_steps": 248831999, "loss": 0.016102509573101997, "avg_return": 0.3096776306629181, "regret": 0.4927114248275757, "entropy": 0.697939932346344, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:02.424741Z", "loop": 405, "env_steps": 249446399, "loss": 0.015420484356582165, "avg_return": 0.30215877294540405, "regret": 0.4927114248275757, "entropy": 0.6976885199546814, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:03.625880Z", "loop": 406, "env_steps": 250060799, "loss": 0.01672150380909443, "avg_return": 0.3127680718898773, "regret": 0.492765873670578, "entropy": 0.6975846886634827, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:04.785609Z", "loop": 407, "env_steps": 250675199, "loss": 0.0173275675624609, "avg_return": 0.31190025806427, "regret": 0.492765873670578, "entropy": 0.6976631283760071, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:05.986192Z", "loop": 408, "env_steps": 251289599, "loss": 0.016620805487036705, "avg_return": 0.3097103536128998, "regret": 0.4927159547805786, "entropy": 0.6976782083511353, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:07.146635Z", "loop": 409, "env_steps": 251903999, "loss": 0.01757306419312954, "avg_return": 0.31460702419281006, "regret": 0.4927159547805786, "entropy": 0.6977767944335938, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:08.347446Z", "loop": 410, "env_steps": 252518399, "loss": 0.017177466303110123, "avg_return": 0.3145312964916229, "regret": 0.4926116466522217, "entropy": 0.6980648636817932, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:09.509364Z", "loop": 411, "env_steps": 253132799, "loss": 0.015881702303886414, "avg_return": 0.30470338463783264, "regret": 0.4926116466522217, "entropy": 0.6981213092803955, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:10.713077Z", "loop": 412, "env_steps": 253747199, "loss": 0.016871115192770958, "avg_return": 0.3139636516571045, "regret": 0.4926438629627228, "entropy": 0.6979553699493408, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:11.872693Z", "loop": 413, "env_steps": 254361599, "loss": 0.0175209641456604, "avg_return": 0.31189799308776855, "regret": 0.4926438629627228, "entropy": 0.697638988494873, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:13.073300Z", "loop": 414, "env_steps": 254975999, "loss": 0.016935832798480988, "avg_return": 0.31290730834007263, "regret": 0.4928855895996094, "entropy": 0.6970995664596558, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:14.232683Z", "loop": 415, "env_steps": 255590399, "loss": 0.017294272780418396, "avg_return": 0.3131525218486786, "regret": 0.4928855895996094, "entropy": 0.6962671279907227, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:15.433931Z", "loop": 416, "env_steps": 256204799, "loss": 0.016467301174998283, "avg_return": 0.3113962411880493, "regret": 0.49326807260513306, "entropy": 0.6956614255905151, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:16.593654Z", "loop": 417, "env_steps": 256819199, "loss": 0.015588657930493355, "avg_return": 0.3043949007987976, "regret": 0.49326807260513306, "entropy": 0.6959929466247559, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:17.792791Z", "loop": 418, "env_steps": 257433599, "loss": 0.016731923446059227, "avg_return": 0.30716225504875183, "regret": 0.4930819571018219, "entropy": 0.6961628198623657, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:18.951587Z", "loop": 419, "env_steps": 258047999, "loss": 0.01662631146609783, "avg_return": 0.31440940499305725, "regret": 0.4930819571018219, "entropy": 0.696793794631958, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:20.152320Z", "loop": 420, "env_steps": 258662399, "loss": 0.0153469517827034, "avg_return": 0.30215102434158325, "regret": 0.4926642179489136, "entropy": 0.6973605751991272, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:21.312359Z", "loop": 421, "env_steps": 259276799, "loss": 0.01694885455071926, "avg_return": 0.3162154257297516, "regret": 0.4926642179489136, "entropy": 0.6975314021110535, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:22.514996Z", "loop": 422, "env_steps": 259891199, "loss": 0.017086049541831017, "avg_return": 0.31172966957092285, "regret": 0.49259406328201294, "entropy": 0.697365403175354, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:23.678141Z", "loop": 423, "env_steps": 260505599, "loss": 0.015974735841155052, "avg_return": 0.3130836486816406, "regret": 0.49259406328201294, "entropy": 0.6970570087432861, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:24.882643Z", "loop": 424, "env_steps": 261119999, "loss": 0.016066420823335648, "avg_return": 0.3087489604949951, "regret": 0.49282410740852356, "entropy": 0.6963303089141846, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:26.045582Z", "loop": 425, "env_steps": 261734399, "loss": 0.016629567369818687, "avg_return": 0.3099532723426819, "regret": 0.49282410740852356, "entropy": 0.6956074237823486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:27.248153Z", "loop": 426, "env_steps": 262348799, "loss": 0.016270693391561508, "avg_return": 0.309270441532135, "regret": 0.4931861162185669, "entropy": 0.6948800086975098, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:28.409837Z", "loop": 427, "env_steps": 262963199, "loss": 0.016632679849863052, "avg_return": 0.31145137548446655, "regret": 0.4931861162185669, "entropy": 0.6948586702346802, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:29.612089Z", "loop": 428, "env_steps": 263577599, "loss": 0.016707396134734154, "avg_return": 0.3122509717941284, "regret": 0.4930076003074646, "entropy": 0.695471465587616, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:30.771969Z", "loop": 429, "env_steps": 264191999, "loss": 0.01709958165884018, "avg_return": 0.310952752828598, "regret": 0.4930076003074646, "entropy": 0.6961961388587952, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:31.973026Z", "loop": 430, "env_steps": 264806399, "loss": 0.0178849957883358, "avg_return": 0.3103048503398895, "regret": 0.49262502789497375, "entropy": 0.6967909932136536, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:33.133189Z", "loop": 431, "env_steps": 265420799, "loss": 0.01666036807000637, "avg_return": 0.30832043290138245, "regret": 0.49262502789497375, "entropy": 0.6969875693321228, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:34.333794Z", "loop": 432, "env_steps": 266035199, "loss": 0.017040738835930824, "avg_return": 0.3140946626663208, "regret": 0.492608904838562, "entropy": 0.696836531162262, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:35.494691Z", "loop": 433, "env_steps": 266649599, "loss": 0.016055116429924965, "avg_return": 0.30721044540405273, "regret": 0.492608904838562, "entropy": 0.6961259841918945, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:36.696180Z", "loop": 434, "env_steps": 267263999, "loss": 0.01747620292007923, "avg_return": 0.3138958811759949, "regret": 0.4930073618888855, "entropy": 0.6954026818275452, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:37.857152Z", "loop": 435, "env_steps": 267878399, "loss": 0.017346922308206558, "avg_return": 0.30886876583099365, "regret": 0.4930073618888855, "entropy": 0.6949305534362793, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:39.059380Z", "loop": 436, "env_steps": 268492799, "loss": 0.015569222159683704, "avg_return": 0.3081076145172119, "regret": 0.49310028553009033, "entropy": 0.6949722766876221, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:40.225214Z", "loop": 437, "env_steps": 269107199, "loss": 0.015477390959858894, "avg_return": 0.30255356431007385, "regret": 0.49310028553009033, "entropy": 0.6955641508102417, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:41.432662Z", "loop": 438, "env_steps": 269721599, "loss": 0.018004802986979485, "avg_return": 0.31019139289855957, "regret": 0.49268636107444763, "entropy": 0.6962894797325134, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:42.597566Z", "loop": 439, "env_steps": 270335999, "loss": 0.01761358603835106, "avg_return": 0.31018364429473877, "regret": 0.49268636107444763, "entropy": 0.6965802907943726, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:43.801837Z", "loop": 440, "env_steps": 270950399, "loss": 0.016172608360648155, "avg_return": 0.3086302876472473, "regret": 0.4925611615180969, "entropy": 0.6966254115104675, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:44.966443Z", "loop": 441, "env_steps": 271564799, "loss": 0.016691764816641808, "avg_return": 0.3151727318763733, "regret": 0.4925611615180969, "entropy": 0.6966344714164734, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:46.170022Z", "loop": 442, "env_steps": 272179199, "loss": 0.016697274520993233, "avg_return": 0.3174843490123749, "regret": 0.4925489127635956, "entropy": 0.6965807676315308, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:47.331098Z", "loop": 443, "env_steps": 272793599, "loss": 0.016059601679444313, "avg_return": 0.3086320161819458, "regret": 0.4925489127635956, "entropy": 0.696547269821167, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:48.531467Z", "loop": 444, "env_steps": 273407999, "loss": 0.01605873368680477, "avg_return": 0.3084038496017456, "regret": 0.4925442636013031, "entropy": 0.6965051293373108, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:49.692568Z", "loop": 445, "env_steps": 274022399, "loss": 0.016948392614722252, "avg_return": 0.31203678250312805, "regret": 0.4925442636013031, "entropy": 0.6964942812919617, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:50.889337Z", "loop": 446, "env_steps": 274636799, "loss": 0.01698162965476513, "avg_return": 0.3111160695552826, "regret": 0.4925401508808136, "entropy": 0.6964688897132874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:52.048507Z", "loop": 447, "env_steps": 275251199, "loss": 0.017763888463377953, "avg_return": 0.3156123459339142, "regret": 0.4925401508808136, "entropy": 0.6964438557624817, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:53.246879Z", "loop": 448, "env_steps": 275865599, "loss": 0.017228752374649048, "avg_return": 0.312447726726532, "regret": 0.49255481362342834, "entropy": 0.6964110136032104, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:54.405099Z", "loop": 449, "env_steps": 276479999, "loss": 0.01656181924045086, "avg_return": 0.31505364179611206, "regret": 0.49255481362342834, "entropy": 0.6964684128761292, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:55.604419Z", "loop": 450, "env_steps": 277094399, "loss": 0.017284460365772247, "avg_return": 0.30810514092445374, "regret": 0.49261245131492615, "entropy": 0.6962339282035828, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:56.764258Z", "loop": 451, "env_steps": 277708799, "loss": 0.017239322885870934, "avg_return": 0.3096763491630554, "regret": 0.49261245131492615, "entropy": 0.6958444714546204, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:57.961033Z", "loop": 452, "env_steps": 278323199, "loss": 0.017384957522153854, "avg_return": 0.3131764829158783, "regret": 0.49287328124046326, "entropy": 0.6953020095825195, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:34:59.119894Z", "loop": 453, "env_steps": 278937599, "loss": 0.017577368766069412, "avg_return": 0.3113294839859009, "regret": 0.49287328124046326, "entropy": 0.695147693157196, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:00.321124Z", "loop": 454, "env_steps": 279551999, "loss": 0.016481947153806686, "avg_return": 0.307247519493103, "regret": 0.49282306432724, "entropy": 0.6953898668289185, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:01.484800Z", "loop": 455, "env_steps": 280166399, "loss": 0.01648538187146187, "avg_return": 0.31302890181541443, "regret": 0.49282306432724, "entropy": 0.6961542367935181, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:02.683058Z", "loop": 456, "env_steps": 280780799, "loss": 0.018237052485346794, "avg_return": 0.31539395451545715, "regret": 0.4925367534160614, "entropy": 0.6961972713470459, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:03.844724Z", "loop": 457, "env_steps": 281395199, "loss": 0.016259005293250084, "avg_return": 0.3116433024406433, "regret": 0.4925367534160614, "entropy": 0.6957238912582397, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:05.044140Z", "loop": 458, "env_steps": 282009599, "loss": 0.01661013811826706, "avg_return": 0.3086654841899872, "regret": 0.49287712574005127, "entropy": 0.6949540972709656, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:06.207987Z", "loop": 459, "env_steps": 282623999, "loss": 0.016618354246020317, "avg_return": 0.3137986660003662, "regret": 0.49287712574005127, "entropy": 0.694348931312561, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:07.420231Z", "loop": 460, "env_steps": 283238399, "loss": 0.016555143520236015, "avg_return": 0.3146437406539917, "regret": 0.49313855171203613, "entropy": 0.694004476070404, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:08.581628Z", "loop": 461, "env_steps": 283852799, "loss": 0.017174314707517624, "avg_return": 0.31374865770339966, "regret": 0.49313855171203613, "entropy": 0.6942046880722046, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:09.789347Z", "loop": 462, "env_steps": 284467199, "loss": 0.017420582473278046, "avg_return": 0.3106357157230377, "regret": 0.49289020895957947, "entropy": 0.6949037909507751, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:10.948816Z", "loop": 463, "env_steps": 285081599, "loss": 0.01570034585893154, "avg_return": 0.3027271628379822, "regret": 0.49289020895957947, "entropy": 0.6957550644874573, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:12.159451Z", "loop": 464, "env_steps": 285695999, "loss": 0.016913708299398422, "avg_return": 0.31356725096702576, "regret": 0.49255871772766113, "entropy": 0.696116030216217, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:13.331153Z", "loop": 465, "env_steps": 286310399, "loss": 0.01682192273437977, "avg_return": 0.31243351101875305, "regret": 0.49255871772766113, "entropy": 0.6962519884109497, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:14.542982Z", "loop": 466, "env_steps": 286924799, "loss": 0.0162365585565567, "avg_return": 0.3111269176006317, "regret": 0.4925209879875183, "entropy": 0.6963161826133728, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:15.707963Z", "loop": 467, "env_steps": 287539199, "loss": 0.01642225682735443, "avg_return": 0.3089708983898163, "regret": 0.4925209879875183, "entropy": 0.6963070034980774, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:16.917784Z", "loop": 468, "env_steps": 288153599, "loss": 0.016690485179424286, "avg_return": 0.31151440739631653, "regret": 0.4925413727760315, "entropy": 0.6963184475898743, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:18.077685Z", "loop": 469, "env_steps": 288767999, "loss": 0.016187965869903564, "avg_return": 0.31191834807395935, "regret": 0.4925413727760315, "entropy": 0.696287989616394, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:19.277943Z", "loop": 470, "env_steps": 289382399, "loss": 0.01639716885983944, "avg_return": 0.3114408850669861, "regret": 0.4925404191017151, "entropy": 0.6963260769844055, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:20.438377Z", "loop": 471, "env_steps": 289996799, "loss": 0.0176213551312685, "avg_return": 0.31407904624938965, "regret": 0.4925404191017151, "entropy": 0.6963512897491455, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:21.639330Z", "loop": 472, "env_steps": 290611199, "loss": 0.016477486118674278, "avg_return": 0.31288111209869385, "regret": 0.4925253987312317, "entropy": 0.6963359713554382, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:22.804993Z", "loop": 473, "env_steps": 291225599, "loss": 0.01686919294297695, "avg_return": 0.3127897083759308, "regret": 0.4925253987312317, "entropy": 0.6963458061218262, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:24.014875Z", "loop": 474, "env_steps": 291839999, "loss": 0.017278140410780907, "avg_return": 0.3128446638584137, "regret": 0.49252215027809143, "entropy": 0.696371853351593, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:25.176174Z", "loop": 475, "env_steps": 292454399, "loss": 0.01610521785914898, "avg_return": 0.3132004737854004, "regret": 0.49252215027809143, "entropy": 0.6963686943054199, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:26.376274Z", "loop": 476, "env_steps": 293068799, "loss": 0.01630844548344612, "avg_return": 0.3136565685272217, "regret": 0.4925236701965332, "entropy": 0.696394681930542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:27.537721Z", "loop": 477, "env_steps": 293683199, "loss": 0.016439301893115044, "avg_return": 0.312806636095047, "regret": 0.4925236701965332, "entropy": 0.6964006423950195, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:28.739295Z", "loop": 478, "env_steps": 294297599, "loss": 0.01615222357213497, "avg_return": 0.3126441538333893, "regret": 0.4925273060798645, "entropy": 0.6963927149772644, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:29.899777Z", "loop": 479, "env_steps": 294911999, "loss": 0.015108969993889332, "avg_return": 0.30778738856315613, "regret": 0.4925273060798645, "entropy": 0.6964161396026611, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:31.108210Z", "loop": 480, "env_steps": 295526399, "loss": 0.016037866473197937, "avg_return": 0.31006941199302673, "regret": 0.49251845479011536, "entropy": 0.6964250206947327, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:32.274149Z", "loop": 481, "env_steps": 296140799, "loss": 0.01564423181116581, "avg_return": 0.3134056031703949, "regret": 0.49251845479011536, "entropy": 0.6964096426963806, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:33.478991Z", "loop": 482, "env_steps": 296755199, "loss": 0.016280097886919975, "avg_return": 0.3114534616470337, "regret": 0.4925229847431183, "entropy": 0.6964346766471863, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:34.638995Z", "loop": 483, "env_steps": 297369599, "loss": 0.01745772175490856, "avg_return": 0.3101697862148285, "regret": 0.4925229847431183, "entropy": 0.6964367628097534, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:35.842318Z", "loop": 484, "env_steps": 297983999, "loss": 0.01634278893470764, "avg_return": 0.3174423277378082, "regret": 0.4925287067890167, "entropy": 0.696401834487915, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:37.004353Z", "loop": 485, "env_steps": 298598399, "loss": 0.01627117209136486, "avg_return": 0.3167300522327423, "regret": 0.4925287067890167, "entropy": 0.696266770362854, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:38.207490Z", "loop": 486, "env_steps": 299212799, "loss": 0.015492054633796215, "avg_return": 0.3109307289123535, "regret": 0.49258702993392944, "entropy": 0.6961781978607178, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:39.368247Z", "loop": 487, "env_steps": 299827199, "loss": 0.016506213694810867, "avg_return": 0.31712454557418823, "regret": 0.49258702993392944, "entropy": 0.6960625052452087, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:40.568264Z", "loop": 488, "env_steps": 300441599, "loss": 0.016536816954612732, "avg_return": 0.3158915042877197, "regret": 0.4925541281700134, "entropy": 0.6962236166000366, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:41.727039Z", "loop": 489, "env_steps": 301055999, "loss": 0.01613016426563263, "avg_return": 0.30983269214630127, "regret": 0.4925541281700134, "entropy": 0.6964449882507324, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:42.927139Z", "loop": 490, "env_steps": 301670399, "loss": 0.015291414223611355, "avg_return": 0.30480527877807617, "regret": 0.4925503432750702, "entropy": 0.6963468194007874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:44.089652Z", "loop": 491, "env_steps": 302284799, "loss": 0.016791759058833122, "avg_return": 0.30587291717529297, "regret": 0.4925503432750702, "entropy": 0.6961760520935059, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:45.291315Z", "loop": 492, "env_steps": 302899199, "loss": 0.016970349475741386, "avg_return": 0.3087104856967926, "regret": 0.4926539361476898, "entropy": 0.6959608793258667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:46.455828Z", "loop": 493, "env_steps": 303513599, "loss": 0.0173958670347929, "avg_return": 0.30532482266426086, "regret": 0.4926539361476898, "entropy": 0.6958033442497253, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:47.670078Z", "loop": 494, "env_steps": 304127999, "loss": 0.01763075217604637, "avg_return": 0.3148888647556305, "regret": 0.49262571334838867, "entropy": 0.6959545612335205, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:48.833555Z", "loop": 495, "env_steps": 304742399, "loss": 0.015268600545823574, "avg_return": 0.3035808503627777, "regret": 0.49262571334838867, "entropy": 0.6961837410926819, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:50.034659Z", "loop": 496, "env_steps": 305356799, "loss": 0.016594188287854195, "avg_return": 0.31619998812675476, "regret": 0.49249517917633057, "entropy": 0.6962767839431763, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:51.195254Z", "loop": 497, "env_steps": 305971199, "loss": 0.016894405707716942, "avg_return": 0.3048992156982422, "regret": 0.49249517917633057, "entropy": 0.6961772441864014, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:52.396124Z", "loop": 498, "env_steps": 306585599, "loss": 0.016016701236367226, "avg_return": 0.3094595670700073, "regret": 0.49264293909072876, "entropy": 0.6957036852836609, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:53.556212Z", "loop": 499, "env_steps": 307199999, "loss": 0.01719731278717518, "avg_return": 0.30776819586753845, "regret": 0.49264293909072876, "entropy": 0.6946069598197937, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:54.758599Z", "loop": 500, "env_steps": 307814399, "loss": 0.017246143892407417, "avg_return": 0.3105911910533905, "regret": 0.49328282475471497, "entropy": 0.6934671401977539, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:55.918058Z", "loop": 501, "env_steps": 308428799, "loss": 0.01705520786345005, "avg_return": 0.3075341284275055, "regret": 0.49328282475471497, "entropy": 0.6922065019607544, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:57.078395Z", "loop": 502, "env_steps": 309043199, "loss": 0.01656501181423664, "avg_return": 0.31264394521713257, "regret": 0.49328282475471497, "entropy": 0.691483199596405, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:58.237323Z", "loop": 503, "env_steps": 309657599, "loss": 0.017318686470389366, "avg_return": 0.30670154094696045, "regret": 0.49328282475471497, "entropy": 0.6916612386703491, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:35:59.396994Z", "loop": 504, "env_steps": 310271999, "loss": 0.017171286046504974, "avg_return": 0.31114405393600464, "regret": 0.49328282475471497, "entropy": 0.6927907466888428, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:00.607567Z", "loop": 505, "env_steps": 310886399, "loss": 0.017042066901922226, "avg_return": 0.31458547711372375, "regret": 0.4930563271045685, "entropy": 0.6945207118988037, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:01.771190Z", "loop": 506, "env_steps": 311500799, "loss": 0.015687905251979828, "avg_return": 0.3100052773952484, "regret": 0.4930563271045685, "entropy": 0.6961089968681335, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:02.932003Z", "loop": 507, "env_steps": 312115199, "loss": 0.01632452756166458, "avg_return": 0.31273674964904785, "regret": 0.4930563271045685, "entropy": 0.6967007517814636, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:04.091527Z", "loop": 508, "env_steps": 312729599, "loss": 0.017301596701145172, "avg_return": 0.3059872090816498, "regret": 0.4930563271045685, "entropy": 0.6963706612586975, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:05.250675Z", "loop": 509, "env_steps": 313343999, "loss": 0.016215680167078972, "avg_return": 0.3105640113353729, "regret": 0.4930563271045685, "entropy": 0.6955415606498718, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:06.450964Z", "loop": 510, "env_steps": 313958399, "loss": 0.01725376956164837, "avg_return": 0.3162800669670105, "regret": 0.4932119846343994, "entropy": 0.6946220993995667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:07.610144Z", "loop": 511, "env_steps": 314572799, "loss": 0.015742167830467224, "avg_return": 0.30734387040138245, "regret": 0.4932119846343994, "entropy": 0.6943674087524414, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:08.773454Z", "loop": 512, "env_steps": 315187199, "loss": 0.01688598282635212, "avg_return": 0.30708202719688416, "regret": 0.4932119846343994, "entropy": 0.6947987675666809, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:09.933807Z", "loop": 513, "env_steps": 315801599, "loss": 0.01715679094195366, "avg_return": 0.30989739298820496, "regret": 0.4932119846343994, "entropy": 0.6953860521316528, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:11.093382Z", "loop": 514, "env_steps": 316415999, "loss": 0.01671198382973671, "avg_return": 0.31388726830482483, "regret": 0.4932119846343994, "entropy": 0.6961653232574463, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:12.297615Z", "loop": 515, "env_steps": 317030399, "loss": 0.016404399648308754, "avg_return": 0.313717246055603, "regret": 0.49256831407546997, "entropy": 0.6968571543693542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:13.458055Z", "loop": 516, "env_steps": 317644799, "loss": 0.01704874448478222, "avg_return": 0.30625560879707336, "regret": 0.49256831407546997, "entropy": 0.6970745325088501, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:14.621106Z", "loop": 517, "env_steps": 318259199, "loss": 0.016020068898797035, "avg_return": 0.3069370985031128, "regret": 0.49256831407546997, "entropy": 0.6966395378112793, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:15.783197Z", "loop": 518, "env_steps": 318873599, "loss": 0.01615065522491932, "avg_return": 0.30911919474601746, "regret": 0.49256831407546997, "entropy": 0.6959400773048401, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:16.943040Z", "loop": 519, "env_steps": 319487999, "loss": 0.01626483164727688, "avg_return": 0.3027098774909973, "regret": 0.49256831407546997, "entropy": 0.6951233744621277, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:18.142676Z", "loop": 520, "env_steps": 320102399, "loss": 0.0163688026368618, "avg_return": 0.3079438805580139, "regret": 0.49327462911605835, "entropy": 0.6942636370658875, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:19.301780Z", "loop": 521, "env_steps": 320716799, "loss": 0.016162332147359848, "avg_return": 0.3102547228336334, "regret": 0.49327462911605835, "entropy": 0.6934607625007629, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:20.461664Z", "loop": 522, "env_steps": 321331199, "loss": 0.016508419066667557, "avg_return": 0.31156104803085327, "regret": 0.49327462911605835, "entropy": 0.6935985684394836, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:21.624096Z", "loop": 523, "env_steps": 321945599, "loss": 0.016929829493165016, "avg_return": 0.3098456859588623, "regret": 0.49327462911605835, "entropy": 0.6939730048179626, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:22.785477Z", "loop": 524, "env_steps": 322559999, "loss": 0.01715841330587864, "avg_return": 0.3120495676994324, "regret": 0.49327462911605835, "entropy": 0.6946753263473511, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:23.994683Z", "loop": 525, "env_steps": 323174399, "loss": 0.01628809981048107, "avg_return": 0.30526450276374817, "regret": 0.49279356002807617, "entropy": 0.6957765221595764, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:25.153688Z", "loop": 526, "env_steps": 323788799, "loss": 0.01639726758003235, "avg_return": 0.3120439946651459, "regret": 0.49279356002807617, "entropy": 0.6965996026992798, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:26.312024Z", "loop": 527, "env_steps": 324403199, "loss": 0.016816411167383194, "avg_return": 0.31551429629325867, "regret": 0.49279356002807617, "entropy": 0.6969382166862488, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:27.470543Z", "loop": 528, "env_steps": 325017599, "loss": 0.016048697754740715, "avg_return": 0.30986857414245605, "regret": 0.49279356002807617, "entropy": 0.6967504620552063, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:28.628296Z", "loop": 529, "env_steps": 325631999, "loss": 0.016766251996159554, "avg_return": 0.3104027807712555, "regret": 0.49279356002807617, "entropy": 0.6962445974349976, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:29.826731Z", "loop": 530, "env_steps": 326246399, "loss": 0.01583981327712536, "avg_return": 0.3112902045249939, "regret": 0.4929283857345581, "entropy": 0.6955939531326294, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:30.985521Z", "loop": 531, "env_steps": 326860799, "loss": 0.016324525699019432, "avg_return": 0.31055623292922974, "regret": 0.4929283857345581, "entropy": 0.6952843070030212, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:32.144891Z", "loop": 532, "env_steps": 327475199, "loss": 0.016379443928599358, "avg_return": 0.3097721040248871, "regret": 0.4929283857345581, "entropy": 0.6948202848434448, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:33.305583Z", "loop": 533, "env_steps": 328089599, "loss": 0.016902035102248192, "avg_return": 0.3067075312137604, "regret": 0.4929283857345581, "entropy": 0.6945659518241882, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:34.464219Z", "loop": 534, "env_steps": 328703999, "loss": 0.016128497198224068, "avg_return": 0.30882909893989563, "regret": 0.4929283857345581, "entropy": 0.6947662234306335, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:35.663120Z", "loop": 535, "env_steps": 329318399, "loss": 0.017870379611849785, "avg_return": 0.3055303394794464, "regret": 0.49304455518722534, "entropy": 0.6948920488357544, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:36.827842Z", "loop": 536, "env_steps": 329932799, "loss": 0.017320210114121437, "avg_return": 0.3122021555900574, "regret": 0.49304455518722534, "entropy": 0.6954567432403564, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:37.987039Z", "loop": 537, "env_steps": 330547199, "loss": 0.016647376120090485, "avg_return": 0.308551162481308, "regret": 0.49304455518722534, "entropy": 0.6958872079849243, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:39.146528Z", "loop": 538, "env_steps": 331161599, "loss": 0.017030756920576096, "avg_return": 0.30807214975357056, "regret": 0.49304455518722534, "entropy": 0.6960402727127075, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:40.305502Z", "loop": 539, "env_steps": 331775999, "loss": 0.01743503287434578, "avg_return": 0.31564223766326904, "regret": 0.49304455518722534, "entropy": 0.6962119340896606, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:41.513617Z", "loop": 540, "env_steps": 332390399, "loss": 0.01747177541255951, "avg_return": 0.3091261088848114, "regret": 0.49249616265296936, "entropy": 0.696336567401886, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:42.690462Z", "loop": 541, "env_steps": 333004799, "loss": 0.01608145795762539, "avg_return": 0.30893850326538086, "regret": 0.49249616265296936, "entropy": 0.6963644623756409, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:43.849771Z", "loop": 542, "env_steps": 333619199, "loss": 0.017067311331629753, "avg_return": 0.31980496644973755, "regret": 0.49249616265296936, "entropy": 0.6962531208992004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:45.012274Z", "loop": 543, "env_steps": 334233599, "loss": 0.017729027196764946, "avg_return": 0.3164275288581848, "regret": 0.49249616265296936, "entropy": 0.6959506273269653, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:46.174931Z", "loop": 544, "env_steps": 334847999, "loss": 0.015760116279125214, "avg_return": 0.3110441267490387, "regret": 0.49249616265296936, "entropy": 0.6954630613327026, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:47.380795Z", "loop": 545, "env_steps": 335462399, "loss": 0.016861174255609512, "avg_return": 0.3075696527957916, "regret": 0.4927213490009308, "entropy": 0.6953686475753784, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:48.542015Z", "loop": 546, "env_steps": 336076799, "loss": 0.016594447195529938, "avg_return": 0.30851441621780396, "regret": 0.4927213490009308, "entropy": 0.6956239342689514, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:49.701832Z", "loop": 547, "env_steps": 336691199, "loss": 0.01658959873020649, "avg_return": 0.3097989857196808, "regret": 0.4927213490009308, "entropy": 0.6958306431770325, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:50.863839Z", "loop": 548, "env_steps": 337305599, "loss": 0.01714397594332695, "avg_return": 0.30476635694503784, "regret": 0.4927213490009308, "entropy": 0.6961047649383545, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:52.032393Z", "loop": 549, "env_steps": 337919999, "loss": 0.01686430349946022, "avg_return": 0.3130221962928772, "regret": 0.4927213490009308, "entropy": 0.696301281452179, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:53.238253Z", "loop": 550, "env_steps": 338534399, "loss": 0.016587769612669945, "avg_return": 0.305254191160202, "regret": 0.4925095736980438, "entropy": 0.6961342096328735, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:54.398920Z", "loop": 551, "env_steps": 339148799, "loss": 0.01661698892712593, "avg_return": 0.3079410195350647, "regret": 0.4925095736980438, "entropy": 0.6956206560134888, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:55.559728Z", "loop": 552, "env_steps": 339763199, "loss": 0.01667756214737892, "avg_return": 0.31497055292129517, "regret": 0.4925095736980438, "entropy": 0.6947072744369507, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:56.720538Z", "loop": 553, "env_steps": 340377599, "loss": 0.016664979979395866, "avg_return": 0.31626057624816895, "regret": 0.4925095736980438, "entropy": 0.6939861178398132, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:57.884679Z", "loop": 554, "env_steps": 340991999, "loss": 0.016886362805962563, "avg_return": 0.3140520751476288, "regret": 0.4925095736980438, "entropy": 0.6936213970184326, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:36:59.103868Z", "loop": 555, "env_steps": 341606399, "loss": 0.017103571444749832, "avg_return": 0.30966025590896606, "regret": 0.49333032965660095, "entropy": 0.6936245560646057, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:00.266270Z", "loop": 556, "env_steps": 342220799, "loss": 0.016837162896990776, "avg_return": 0.3135521411895752, "regret": 0.49333032965660095, "entropy": 0.694327712059021, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:01.426905Z", "loop": 557, "env_steps": 342835199, "loss": 0.016104960814118385, "avg_return": 0.31718164682388306, "regret": 0.49333032965660095, "entropy": 0.6949062943458557, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:02.585283Z", "loop": 558, "env_steps": 343449599, "loss": 0.01650049351155758, "avg_return": 0.3018137216567993, "regret": 0.49333032965660095, "entropy": 0.6954472064971924, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:03.743608Z", "loop": 559, "env_steps": 344063999, "loss": 0.01683369092643261, "avg_return": 0.30918440222740173, "regret": 0.49333032965660095, "entropy": 0.6959127187728882, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:04.956315Z", "loop": 560, "env_steps": 344678399, "loss": 0.018058132380247116, "avg_return": 0.31891536712646484, "regret": 0.4926378130912781, "entropy": 0.696146547794342, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:06.123438Z", "loop": 561, "env_steps": 345292799, "loss": 0.016471458598971367, "avg_return": 0.3048069477081299, "regret": 0.4926378130912781, "entropy": 0.6965721249580383, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:07.283084Z", "loop": 562, "env_steps": 345907199, "loss": 0.015982111915946007, "avg_return": 0.3192908763885498, "regret": 0.4926378130912781, "entropy": 0.6967149972915649, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:08.442098Z", "loop": 563, "env_steps": 346521599, "loss": 0.016642514616250992, "avg_return": 0.3073362708091736, "regret": 0.4926378130912781, "entropy": 0.6968258023262024, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:09.601868Z", "loop": 564, "env_steps": 347135999, "loss": 0.01776607148349285, "avg_return": 0.3126242458820343, "regret": 0.4926378130912781, "entropy": 0.6969054937362671, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:10.804025Z", "loop": 565, "env_steps": 347750399, "loss": 0.017036302015185356, "avg_return": 0.3144218623638153, "regret": 0.4924639165401459, "entropy": 0.6970181465148926, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:11.967863Z", "loop": 566, "env_steps": 348364799, "loss": 0.01562628336250782, "avg_return": 0.3042997419834137, "regret": 0.4924639165401459, "entropy": 0.6970680356025696, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:13.134003Z", "loop": 567, "env_steps": 348979199, "loss": 0.016162460669875145, "avg_return": 0.31526169180870056, "regret": 0.4924639165401459, "entropy": 0.6970963478088379, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:14.298142Z", "loop": 568, "env_steps": 349593599, "loss": 0.01736440137028694, "avg_return": 0.3158068358898163, "regret": 0.4924639165401459, "entropy": 0.6971126794815063, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:15.458273Z", "loop": 569, "env_steps": 350207999, "loss": 0.016346557065844536, "avg_return": 0.3094591200351715, "regret": 0.4924639165401459, "entropy": 0.6971037983894348, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:16.660875Z", "loop": 570, "env_steps": 350822399, "loss": 0.016321850940585136, "avg_return": 0.31030258536338806, "regret": 0.49252796173095703, "entropy": 0.6971085071563721, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:17.824091Z", "loop": 571, "env_steps": 351436799, "loss": 0.015390351414680481, "avg_return": 0.30870625376701355, "regret": 0.49252796173095703, "entropy": 0.6972116231918335, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:18.987632Z", "loop": 572, "env_steps": 352051199, "loss": 0.016254784539341927, "avg_return": 0.3059062361717224, "regret": 0.49252796173095703, "entropy": 0.6974186301231384, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:20.150564Z", "loop": 573, "env_steps": 352665599, "loss": 0.01620902121067047, "avg_return": 0.3133046627044678, "regret": 0.49252796173095703, "entropy": 0.6975113153457642, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:21.310815Z", "loop": 574, "env_steps": 353279999, "loss": 0.01787681132555008, "avg_return": 0.30433112382888794, "regret": 0.49252796173095703, "entropy": 0.6975517868995667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:22.515924Z", "loop": 575, "env_steps": 353894399, "loss": 0.015661360695958138, "avg_return": 0.31788915395736694, "regret": 0.49247002601623535, "entropy": 0.6975805163383484, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:23.675894Z", "loop": 576, "env_steps": 354508799, "loss": 0.016132069751620293, "avg_return": 0.31171098351478577, "regret": 0.49247002601623535, "entropy": 0.6975633502006531, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:24.836272Z", "loop": 577, "env_steps": 355123199, "loss": 0.0160328708589077, "avg_return": 0.30991461873054504, "regret": 0.49247002601623535, "entropy": 0.6975559592247009, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:25.995379Z", "loop": 578, "env_steps": 355737599, "loss": 0.016555165871977806, "avg_return": 0.3069031834602356, "regret": 0.49247002601623535, "entropy": 0.6974530816078186, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:27.155573Z", "loop": 579, "env_steps": 356351999, "loss": 0.017057061195373535, "avg_return": 0.310287743806839, "regret": 0.49247002601623535, "entropy": 0.6973884701728821, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:28.355492Z", "loop": 580, "env_steps": 356966399, "loss": 0.017364628612995148, "avg_return": 0.3119966685771942, "regret": 0.49249517917633057, "entropy": 0.6973591446876526, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:29.517345Z", "loop": 581, "env_steps": 357580799, "loss": 0.01664910279214382, "avg_return": 0.3052956163883209, "regret": 0.49249517917633057, "entropy": 0.6973685026168823, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:30.681803Z", "loop": 582, "env_steps": 358195199, "loss": 0.016955189406871796, "avg_return": 0.31398555636405945, "regret": 0.49249517917633057, "entropy": 0.6973468661308289, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:31.842951Z", "loop": 583, "env_steps": 358809599, "loss": 0.016883132979273796, "avg_return": 0.30892300605773926, "regret": 0.49249517917633057, "entropy": 0.6972860097885132, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:33.003003Z", "loop": 584, "env_steps": 359423999, "loss": 0.016180939972400665, "avg_return": 0.30911093950271606, "regret": 0.49249517917633057, "entropy": 0.6972047686576843, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:34.207713Z", "loop": 585, "env_steps": 360038399, "loss": 0.017049511894583702, "avg_return": 0.30794233083724976, "regret": 0.49245455861091614, "entropy": 0.6970973014831543, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:35.368681Z", "loop": 586, "env_steps": 360652799, "loss": 0.016578104346990585, "avg_return": 0.3115837275981903, "regret": 0.49245455861091614, "entropy": 0.6969270706176758, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:36.528780Z", "loop": 587, "env_steps": 361267199, "loss": 0.01687724143266678, "avg_return": 0.30792883038520813, "regret": 0.49245455861091614, "entropy": 0.6966527700424194, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:37.687303Z", "loop": 588, "env_steps": 361881599, "loss": 0.017539553344249725, "avg_return": 0.31033527851104736, "regret": 0.49245455861091614, "entropy": 0.6961298584938049, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:38.846477Z", "loop": 589, "env_steps": 362495999, "loss": 0.017232032492756844, "avg_return": 0.3182018995285034, "regret": 0.49245455861091614, "entropy": 0.6954754590988159, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:40.046858Z", "loop": 590, "env_steps": 363110399, "loss": 0.01624905876815319, "avg_return": 0.31323081254959106, "regret": 0.49294155836105347, "entropy": 0.6950117945671082, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:41.206554Z", "loop": 591, "env_steps": 363724799, "loss": 0.016461363062262535, "avg_return": 0.30488693714141846, "regret": 0.49294155836105347, "entropy": 0.6951232552528381, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:42.365898Z", "loop": 592, "env_steps": 364339199, "loss": 0.01563822664320469, "avg_return": 0.3109703063964844, "regret": 0.49294155836105347, "entropy": 0.6951832175254822, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:43.526208Z", "loop": 593, "env_steps": 364953599, "loss": 0.0164511576294899, "avg_return": 0.3152781128883362, "regret": 0.49294155836105347, "entropy": 0.694891631603241, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:44.685186Z", "loop": 594, "env_steps": 365567999, "loss": 0.017664045095443726, "avg_return": 0.3158952593803406, "regret": 0.49294155836105347, "entropy": 0.6949642300605774, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:45.886565Z", "loop": 595, "env_steps": 366182399, "loss": 0.01751505397260189, "avg_return": 0.3121553063392639, "regret": 0.4928688406944275, "entropy": 0.6948990821838379, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:47.045872Z", "loop": 596, "env_steps": 366796799, "loss": 0.016943974420428276, "avg_return": 0.3124586343765259, "regret": 0.4928688406944275, "entropy": 0.6948404312133789, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:48.208305Z", "loop": 597, "env_steps": 367411199, "loss": 0.015255488455295563, "avg_return": 0.3068296015262604, "regret": 0.4928688406944275, "entropy": 0.6953645944595337, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:49.368561Z", "loop": 598, "env_steps": 368025599, "loss": 0.018279997631907463, "avg_return": 0.3221686780452728, "regret": 0.4928688406944275, "entropy": 0.6958653926849365, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:50.529251Z", "loop": 599, "env_steps": 368639999, "loss": 0.01610337570309639, "avg_return": 0.30745989084243774, "regret": 0.4928688406944275, "entropy": 0.6963021755218506, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:51.732331Z", "loop": 600, "env_steps": 369254399, "loss": 0.015010199509561062, "avg_return": 0.30663472414016724, "regret": 0.4924098253250122, "entropy": 0.6963791251182556, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:52.893696Z", "loop": 601, "env_steps": 369868799, "loss": 0.01606825925409794, "avg_return": 0.30579039454460144, "regret": 0.4924098253250122, "entropy": 0.6963502764701843, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:54.054034Z", "loop": 602, "env_steps": 370483199, "loss": 0.01612101122736931, "avg_return": 0.30907168984413147, "regret": 0.4924098253250122, "entropy": 0.6962630152702332, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:55.214847Z", "loop": 603, "env_steps": 371097599, "loss": 0.017131995409727097, "avg_return": 0.31626230478286743, "regret": 0.4924098253250122, "entropy": 0.6959957480430603, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:56.374541Z", "loop": 604, "env_steps": 371711999, "loss": 0.017341729253530502, "avg_return": 0.31452327966690063, "regret": 0.4924098253250122, "entropy": 0.6956108808517456, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:57.575844Z", "loop": 605, "env_steps": 372326399, "loss": 0.01719515211880207, "avg_return": 0.3121795356273651, "regret": 0.4926232695579529, "entropy": 0.695578932762146, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:58.734971Z", "loop": 606, "env_steps": 372940799, "loss": 0.01598007045686245, "avg_return": 0.31034934520721436, "regret": 0.4926232695579529, "entropy": 0.6956387162208557, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:37:59.895281Z", "loop": 607, "env_steps": 373555199, "loss": 0.01614379696547985, "avg_return": 0.31210166215896606, "regret": 0.4926232695579529, "entropy": 0.695914089679718, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:01.054477Z", "loop": 608, "env_steps": 374169599, "loss": 0.01657903753221035, "avg_return": 0.3099548816680908, "regret": 0.4926232695579529, "entropy": 0.6961578130722046, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:02.214536Z", "loop": 609, "env_steps": 374783999, "loss": 0.01768423803150654, "avg_return": 0.3165428340435028, "regret": 0.4926232695579529, "entropy": 0.6962987184524536, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:03.413689Z", "loop": 610, "env_steps": 375398399, "loss": 0.017403913661837578, "avg_return": 0.3127284646034241, "regret": 0.4924430251121521, "entropy": 0.6961281895637512, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:04.577743Z", "loop": 611, "env_steps": 376012799, "loss": 0.017700260505080223, "avg_return": 0.3129948377609253, "regret": 0.4924430251121521, "entropy": 0.6955984830856323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:05.736973Z", "loop": 612, "env_steps": 376627199, "loss": 0.016575777903199196, "avg_return": 0.3063414394855499, "regret": 0.4924430251121521, "entropy": 0.69505774974823, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:06.897962Z", "loop": 613, "env_steps": 377241599, "loss": 0.01708449423313141, "avg_return": 0.30954253673553467, "regret": 0.4924430251121521, "entropy": 0.6952162981033325, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:08.058769Z", "loop": 614, "env_steps": 377855999, "loss": 0.015430326573550701, "avg_return": 0.31059104204177856, "regret": 0.4924430251121521, "entropy": 0.6958298087120056, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:09.261688Z", "loop": 615, "env_steps": 378470399, "loss": 0.016197163611650467, "avg_return": 0.3019234240055084, "regret": 0.49243858456611633, "entropy": 0.6963917016983032, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:10.422529Z", "loop": 616, "env_steps": 379084799, "loss": 0.016357416287064552, "avg_return": 0.30877992510795593, "regret": 0.49243858456611633, "entropy": 0.6966280937194824, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:11.585466Z", "loop": 617, "env_steps": 379699199, "loss": 0.01667874865233898, "avg_return": 0.30336877703666687, "regret": 0.49243858456611633, "entropy": 0.6965909600257874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:12.744520Z", "loop": 618, "env_steps": 380313599, "loss": 0.017109347507357597, "avg_return": 0.30921465158462524, "regret": 0.49243858456611633, "entropy": 0.6963931322097778, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:13.904856Z", "loop": 619, "env_steps": 380927999, "loss": 0.01640981063246727, "avg_return": 0.3100528419017792, "regret": 0.49243858456611633, "entropy": 0.6961873769760132, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:15.107100Z", "loop": 620, "env_steps": 381542399, "loss": 0.01865389384329319, "avg_return": 0.3182539641857147, "regret": 0.49252739548683167, "entropy": 0.6961336135864258, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:16.268225Z", "loop": 621, "env_steps": 382156799, "loss": 0.01649133302271366, "avg_return": 0.30998170375823975, "regret": 0.49252739548683167, "entropy": 0.6961800456047058, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:17.427913Z", "loop": 622, "env_steps": 382771199, "loss": 0.015939239412546158, "avg_return": 0.3087581694126129, "regret": 0.49252739548683167, "entropy": 0.6963644027709961, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:18.587406Z", "loop": 623, "env_steps": 383385599, "loss": 0.016520386561751366, "avg_return": 0.3092638850212097, "regret": 0.49252739548683167, "entropy": 0.6964712142944336, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:19.746005Z", "loop": 624, "env_steps": 383999999, "loss": 0.016421275213360786, "avg_return": 0.3086485266685486, "regret": 0.49252739548683167, "entropy": 0.6963670253753662, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:20.947153Z", "loop": 625, "env_steps": 384614399, "loss": 0.0158951785415411, "avg_return": 0.31644299626350403, "regret": 0.4925045967102051, "entropy": 0.6959079504013062, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:22.107655Z", "loop": 626, "env_steps": 385228799, "loss": 0.016695581376552582, "avg_return": 0.3090836703777313, "regret": 0.4925045967102051, "entropy": 0.6954070329666138, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:23.268236Z", "loop": 627, "env_steps": 385843199, "loss": 0.017252590507268906, "avg_return": 0.31050002574920654, "regret": 0.4925045967102051, "entropy": 0.6949758529663086, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:24.427863Z", "loop": 628, "env_steps": 386457599, "loss": 0.016748547554016113, "avg_return": 0.3132176697254181, "regret": 0.4925045967102051, "entropy": 0.6951742172241211, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:25.588002Z", "loop": 629, "env_steps": 387071999, "loss": 0.016580598428845406, "avg_return": 0.30739468336105347, "regret": 0.4925045967102051, "entropy": 0.6955150961875916, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:26.789083Z", "loop": 630, "env_steps": 387686399, "loss": 0.016259504482150078, "avg_return": 0.30731597542762756, "regret": 0.49242642521858215, "entropy": 0.6960495710372925, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:27.951000Z", "loop": 631, "env_steps": 388300799, "loss": 0.016636667773127556, "avg_return": 0.31181445717811584, "regret": 0.49242642521858215, "entropy": 0.6962783336639404, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:29.111888Z", "loop": 632, "env_steps": 388915199, "loss": 0.017576295882463455, "avg_return": 0.31986337900161743, "regret": 0.49242642521858215, "entropy": 0.6962026357650757, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:30.272522Z", "loop": 633, "env_steps": 389529599, "loss": 0.014838899485766888, "avg_return": 0.3068041205406189, "regret": 0.49242642521858215, "entropy": 0.6958416700363159, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:31.432782Z", "loop": 634, "env_steps": 390143999, "loss": 0.01638464815914631, "avg_return": 0.31588903069496155, "regret": 0.49242642521858215, "entropy": 0.6955429315567017, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:32.642897Z", "loop": 635, "env_steps": 390758399, "loss": 0.016719358041882515, "avg_return": 0.3218795955181122, "regret": 0.49263796210289, "entropy": 0.6951998472213745, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:33.802763Z", "loop": 636, "env_steps": 391372799, "loss": 0.01588117517530918, "avg_return": 0.30789586901664734, "regret": 0.49263796210289, "entropy": 0.6949793696403503, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:34.963516Z", "loop": 637, "env_steps": 391987199, "loss": 0.016225462779402733, "avg_return": 0.3079075813293457, "regret": 0.49263796210289, "entropy": 0.6949581503868103, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:36.123021Z", "loop": 638, "env_steps": 392601599, "loss": 0.01597827486693859, "avg_return": 0.30517128109931946, "regret": 0.49263796210289, "entropy": 0.6951431632041931, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:37.282676Z", "loop": 639, "env_steps": 393215999, "loss": 0.016519034281373024, "avg_return": 0.3148690462112427, "regret": 0.49263796210289, "entropy": 0.6954483389854431, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:38.485180Z", "loop": 640, "env_steps": 393830399, "loss": 0.015612444840371609, "avg_return": 0.30698856711387634, "regret": 0.49241018295288086, "entropy": 0.6956543326377869, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:39.646091Z", "loop": 641, "env_steps": 394444799, "loss": 0.01795598678290844, "avg_return": 0.31003183126449585, "regret": 0.49241018295288086, "entropy": 0.6957477927207947, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:40.806315Z", "loop": 642, "env_steps": 395059199, "loss": 0.01640891842544079, "avg_return": 0.314648300409317, "regret": 0.49241018295288086, "entropy": 0.6957899928092957, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:41.967517Z", "loop": 643, "env_steps": 395673599, "loss": 0.017178233712911606, "avg_return": 0.31243962049484253, "regret": 0.49241018295288086, "entropy": 0.6956151723861694, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:43.130409Z", "loop": 644, "env_steps": 396287999, "loss": 0.016216641291975975, "avg_return": 0.311274915933609, "regret": 0.49241018295288086, "entropy": 0.6949921250343323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:44.332970Z", "loop": 645, "env_steps": 396902399, "loss": 0.017208216711878777, "avg_return": 0.3179856538772583, "regret": 0.4928918182849884, "entropy": 0.6936097145080566, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:45.492473Z", "loop": 646, "env_steps": 397516799, "loss": 0.0176984965801239, "avg_return": 0.3065594434738159, "regret": 0.4928918182849884, "entropy": 0.6922817826271057, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:46.651784Z", "loop": 647, "env_steps": 398131199, "loss": 0.015520674176514149, "avg_return": 0.30692434310913086, "regret": 0.4928918182849884, "entropy": 0.6922414302825928, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:47.812141Z", "loop": 648, "env_steps": 398745599, "loss": 0.016065528616309166, "avg_return": 0.3064785301685333, "regret": 0.4928918182849884, "entropy": 0.6925634741783142, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:48.973135Z", "loop": 649, "env_steps": 399359999, "loss": 0.016675172373652458, "avg_return": 0.30977627635002136, "regret": 0.4928918182849884, "entropy": 0.6930227279663086, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:50.178196Z", "loop": 650, "env_steps": 399974399, "loss": 0.016048969700932503, "avg_return": 0.3089749813079834, "regret": 0.49281397461891174, "entropy": 0.6937240362167358, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:51.337101Z", "loop": 651, "env_steps": 400588799, "loss": 0.01577073521912098, "avg_return": 0.3054182529449463, "regret": 0.49281397461891174, "entropy": 0.6946489810943604, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:52.496625Z", "loop": 652, "env_steps": 401203199, "loss": 0.017726322636008263, "avg_return": 0.3229396641254425, "regret": 0.49281397461891174, "entropy": 0.6950258016586304, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:53.657433Z", "loop": 653, "env_steps": 401817599, "loss": 0.014566508121788502, "avg_return": 0.3099047541618347, "regret": 0.49281397461891174, "entropy": 0.6952863335609436, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:54.818408Z", "loop": 654, "env_steps": 402431999, "loss": 0.016911296173930168, "avg_return": 0.308024138212204, "regret": 0.49281397461891174, "entropy": 0.6954390406608582, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:56.019888Z", "loop": 655, "env_steps": 403046399, "loss": 0.01656721532344818, "avg_return": 0.3108706772327423, "regret": 0.4922969937324524, "entropy": 0.6954551935195923, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:57.180150Z", "loop": 656, "env_steps": 403660799, "loss": 0.015467317774891853, "avg_return": 0.31109732389450073, "regret": 0.4922969937324524, "entropy": 0.6954138875007629, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:58.339480Z", "loop": 657, "env_steps": 404275199, "loss": 0.016231141984462738, "avg_return": 0.31173309683799744, "regret": 0.4922969937324524, "entropy": 0.6953556537628174, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:38:59.500752Z", "loop": 658, "env_steps": 404889599, "loss": 0.016653375700116158, "avg_return": 0.3155839741230011, "regret": 0.4922969937324524, "entropy": 0.6952254176139832, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:00.660665Z", "loop": 659, "env_steps": 405503999, "loss": 0.016998058184981346, "avg_return": 0.3166812062263489, "regret": 0.4922969937324524, "entropy": 0.6950316429138184, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:01.862383Z", "loop": 660, "env_steps": 406118399, "loss": 0.015770986676216125, "avg_return": 0.3082124888896942, "regret": 0.4923816919326782, "entropy": 0.6949203014373779, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:03.021527Z", "loop": 661, "env_steps": 406732799, "loss": 0.016229545697569847, "avg_return": 0.30837753415107727, "regret": 0.4923816919326782, "entropy": 0.6949219703674316, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:04.179953Z", "loop": 662, "env_steps": 407347199, "loss": 0.017443837597966194, "avg_return": 0.312020480632782, "regret": 0.4923816919326782, "entropy": 0.6948257684707642, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:05.340935Z", "loop": 663, "env_steps": 407961599, "loss": 0.01564027927815914, "avg_return": 0.3069247603416443, "regret": 0.4923816919326782, "entropy": 0.694878339767456, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:06.509735Z", "loop": 664, "env_steps": 408575999, "loss": 0.01677796244621277, "avg_return": 0.31109604239463806, "regret": 0.4923816919326782, "entropy": 0.6949881315231323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:07.729083Z", "loop": 665, "env_steps": 409190399, "loss": 0.016001692041754723, "avg_return": 0.30704301595687866, "regret": 0.49227356910705566, "entropy": 0.6950080394744873, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:08.890742Z", "loop": 666, "env_steps": 409804799, "loss": 0.015990829095244408, "avg_return": 0.31000906229019165, "regret": 0.49227356910705566, "entropy": 0.6950106620788574, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:10.050093Z", "loop": 667, "env_steps": 410419199, "loss": 0.016219817101955414, "avg_return": 0.3118993639945984, "regret": 0.49227356910705566, "entropy": 0.6949177384376526, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:11.209799Z", "loop": 668, "env_steps": 411033599, "loss": 0.01604735478758812, "avg_return": 0.3130306899547577, "regret": 0.49227356910705566, "entropy": 0.6948869824409485, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:12.368878Z", "loop": 669, "env_steps": 411647999, "loss": 0.018201595172286034, "avg_return": 0.3195229768753052, "regret": 0.49227356910705566, "entropy": 0.6948561668395996, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:13.577375Z", "loop": 670, "env_steps": 412262399, "loss": 0.016637442633509636, "avg_return": 0.3104981482028961, "regret": 0.4922589659690857, "entropy": 0.6949074864387512, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:14.744926Z", "loop": 671, "env_steps": 412876799, "loss": 0.01605682447552681, "avg_return": 0.3043828010559082, "regret": 0.4922589659690857, "entropy": 0.6949482560157776, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:15.911774Z", "loop": 672, "env_steps": 413491199, "loss": 0.01545634400099516, "avg_return": 0.311095654964447, "regret": 0.4922589659690857, "entropy": 0.694886326789856, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:17.074298Z", "loop": 673, "env_steps": 414105599, "loss": 0.016522305086255074, "avg_return": 0.3107728064060211, "regret": 0.4922589659690857, "entropy": 0.6947404742240906, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:18.234674Z", "loop": 674, "env_steps": 414719999, "loss": 0.01583549939095974, "avg_return": 0.31396612524986267, "regret": 0.4922589659690857, "entropy": 0.6946417093276978, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:19.441019Z", "loop": 675, "env_steps": 415334399, "loss": 0.015929361805319786, "avg_return": 0.30928516387939453, "regret": 0.4922811985015869, "entropy": 0.6947191953659058, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:20.600970Z", "loop": 676, "env_steps": 415948799, "loss": 0.016418464481830597, "avg_return": 0.30845826864242554, "regret": 0.4922811985015869, "entropy": 0.6948962211608887, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:21.760572Z", "loop": 677, "env_steps": 416563199, "loss": 0.01661860942840576, "avg_return": 0.312024861574173, "regret": 0.4922811985015869, "entropy": 0.6949273943901062, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:22.919598Z", "loop": 678, "env_steps": 417177599, "loss": 0.016449349001049995, "avg_return": 0.31620296835899353, "regret": 0.4922811985015869, "entropy": 0.6949180364608765, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:24.081898Z", "loop": 679, "env_steps": 417791999, "loss": 0.017461637035012245, "avg_return": 0.3067573606967926, "regret": 0.4922811985015869, "entropy": 0.6949430108070374, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:25.294638Z", "loop": 680, "env_steps": 418406399, "loss": 0.0171196348965168, "avg_return": 0.31454065442085266, "regret": 0.4922177791595459, "entropy": 0.6949267387390137, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:26.455958Z", "loop": 681, "env_steps": 419020799, "loss": 0.01663813553750515, "avg_return": 0.31083041429519653, "regret": 0.4922177791595459, "entropy": 0.6949427723884583, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:27.615643Z", "loop": 682, "env_steps": 419635199, "loss": 0.01598413847386837, "avg_return": 0.31630685925483704, "regret": 0.4922177791595459, "entropy": 0.6949189305305481, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:28.775900Z", "loop": 683, "env_steps": 420249599, "loss": 0.017991049215197563, "avg_return": 0.3187643587589264, "regret": 0.4922177791595459, "entropy": 0.6948439478874207, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:29.934788Z", "loop": 684, "env_steps": 420863999, "loss": 0.016648681834340096, "avg_return": 0.3076641857624054, "regret": 0.4922177791595459, "entropy": 0.6945774555206299, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:31.135966Z", "loop": 685, "env_steps": 421478399, "loss": 0.016170594841241837, "avg_return": 0.3082265853881836, "regret": 0.49229565262794495, "entropy": 0.6945405602455139, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:32.294768Z", "loop": 686, "env_steps": 422092799, "loss": 0.01638125814497471, "avg_return": 0.3108084499835968, "regret": 0.49229565262794495, "entropy": 0.6945751309394836, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:33.454418Z", "loop": 687, "env_steps": 422707199, "loss": 0.017107224091887474, "avg_return": 0.3086143434047699, "regret": 0.49229565262794495, "entropy": 0.6946383714675903, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:34.614216Z", "loop": 688, "env_steps": 423321599, "loss": 0.016571132466197014, "avg_return": 0.31536585092544556, "regret": 0.49229565262794495, "entropy": 0.6948639154434204, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:35.773568Z", "loop": 689, "env_steps": 423935999, "loss": 0.016487179324030876, "avg_return": 0.30730557441711426, "regret": 0.49229565262794495, "entropy": 0.6949058771133423, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:36.984048Z", "loop": 690, "env_steps": 424550399, "loss": 0.016630234196782112, "avg_return": 0.3122320771217346, "regret": 0.49220073223114014, "entropy": 0.6948598027229309, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:38.146171Z", "loop": 691, "env_steps": 425164799, "loss": 0.017576348036527634, "avg_return": 0.31233975291252136, "regret": 0.49220073223114014, "entropy": 0.6948034167289734, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:39.307658Z", "loop": 692, "env_steps": 425779199, "loss": 0.016763312742114067, "avg_return": 0.315314382314682, "regret": 0.49220073223114014, "entropy": 0.6948473453521729, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:40.469014Z", "loop": 693, "env_steps": 426393599, "loss": 0.016550231724977493, "avg_return": 0.3098412752151489, "regret": 0.49220073223114014, "entropy": 0.6948129534721375, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:41.629696Z", "loop": 694, "env_steps": 427007999, "loss": 0.017740117385983467, "avg_return": 0.3089825510978699, "regret": 0.49220073223114014, "entropy": 0.6947821378707886, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:42.831396Z", "loop": 695, "env_steps": 427622399, "loss": 0.016775429248809814, "avg_return": 0.3124599754810333, "regret": 0.49218133091926575, "entropy": 0.6947624683380127, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:43.990915Z", "loop": 696, "env_steps": 428236799, "loss": 0.016395116224884987, "avg_return": 0.31221166253089905, "regret": 0.49218133091926575, "entropy": 0.6946592926979065, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:45.150550Z", "loop": 697, "env_steps": 428851199, "loss": 0.01676817610859871, "avg_return": 0.30882787704467773, "regret": 0.49218133091926575, "entropy": 0.6943598985671997, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:46.310408Z", "loop": 698, "env_steps": 429465599, "loss": 0.016681643202900887, "avg_return": 0.30630794167518616, "regret": 0.49218133091926575, "entropy": 0.6936563849449158, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:47.470696Z", "loop": 699, "env_steps": 430079999, "loss": 0.01675013266503811, "avg_return": 0.3073256015777588, "regret": 0.49218133091926575, "entropy": 0.6926584243774414, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:48.674423Z", "loop": 700, "env_steps": 430694399, "loss": 0.01714293099939823, "avg_return": 0.3152834475040436, "regret": 0.49288344383239746, "entropy": 0.6921346187591553, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:49.836016Z", "loop": 701, "env_steps": 431308799, "loss": 0.016631316393613815, "avg_return": 0.3136431574821472, "regret": 0.49288344383239746, "entropy": 0.6923806667327881, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:50.995618Z", "loop": 702, "env_steps": 431923199, "loss": 0.016943832859396935, "avg_return": 0.31056976318359375, "regret": 0.49288344383239746, "entropy": 0.6931990385055542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:52.158873Z", "loop": 703, "env_steps": 432537599, "loss": 0.016888432204723358, "avg_return": 0.310812383890152, "regret": 0.49288344383239746, "entropy": 0.6938493847846985, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:53.319194Z", "loop": 704, "env_steps": 433151999, "loss": 0.016258366405963898, "avg_return": 0.3083299398422241, "regret": 0.49288344383239746, "entropy": 0.6943764090538025, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:54.526793Z", "loop": 705, "env_steps": 433766399, "loss": 0.015793805941939354, "avg_return": 0.30930954217910767, "regret": 0.4921457767486572, "entropy": 0.6947004199028015, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:55.688856Z", "loop": 706, "env_steps": 434380799, "loss": 0.016414865851402283, "avg_return": 0.3120644986629486, "regret": 0.4921457767486572, "entropy": 0.6947155594825745, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:56.848974Z", "loop": 707, "env_steps": 434995199, "loss": 0.016276415437459946, "avg_return": 0.31420379877090454, "regret": 0.4921457767486572, "entropy": 0.6943989396095276, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:58.010192Z", "loop": 708, "env_steps": 435609599, "loss": 0.01639578863978386, "avg_return": 0.31155773997306824, "regret": 0.4921457767486572, "entropy": 0.6940620541572571, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:39:59.170460Z", "loop": 709, "env_steps": 436223999, "loss": 0.015276043675839901, "avg_return": 0.30693963170051575, "regret": 0.4921457767486572, "entropy": 0.6935760974884033, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:00.371992Z", "loop": 710, "env_steps": 436838399, "loss": 0.016860196366906166, "avg_return": 0.3162895143032074, "regret": 0.4925754964351654, "entropy": 0.6931787133216858, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:01.532651Z", "loop": 711, "env_steps": 437452799, "loss": 0.016024531796574593, "avg_return": 0.31310147047042847, "regret": 0.4925754964351654, "entropy": 0.6935641169548035, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:02.692568Z", "loop": 712, "env_steps": 438067199, "loss": 0.01655891351401806, "avg_return": 0.3093913793563843, "regret": 0.4925754964351654, "entropy": 0.6939361691474915, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:03.852575Z", "loop": 713, "env_steps": 438681599, "loss": 0.016451139003038406, "avg_return": 0.3098496198654175, "regret": 0.4925754964351654, "entropy": 0.6943346261978149, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:05.012420Z", "loop": 714, "env_steps": 439295999, "loss": 0.016395634040236473, "avg_return": 0.3087238073348999, "regret": 0.4925754964351654, "entropy": 0.6946396827697754, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:06.214091Z", "loop": 715, "env_steps": 439910399, "loss": 0.015715304762125015, "avg_return": 0.3100697994232178, "regret": 0.4921497404575348, "entropy": 0.6944022178649902, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:07.375014Z", "loop": 716, "env_steps": 440524799, "loss": 0.017825761809945107, "avg_return": 0.3134112060070038, "regret": 0.4921497404575348, "entropy": 0.6929594278335571, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:08.534124Z", "loop": 717, "env_steps": 441139199, "loss": 0.017114045098423958, "avg_return": 0.31190982460975647, "regret": 0.4921497404575348, "entropy": 0.6917453408241272, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:09.693943Z", "loop": 718, "env_steps": 441753599, "loss": 0.015515095554292202, "avg_return": 0.30838924646377563, "regret": 0.4921497404575348, "entropy": 0.6922675371170044, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:10.852598Z", "loop": 719, "env_steps": 442367999, "loss": 0.015726303681731224, "avg_return": 0.30931100249290466, "regret": 0.4921497404575348, "entropy": 0.6931211352348328, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:12.054322Z", "loop": 720, "env_steps": 442982399, "loss": 0.017367662861943245, "avg_return": 0.31465357542037964, "regret": 0.4923170506954193, "entropy": 0.6938948631286621, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:13.214030Z", "loop": 721, "env_steps": 443596799, "loss": 0.016735950484871864, "avg_return": 0.3116369843482971, "regret": 0.4923170506954193, "entropy": 0.6945030093193054, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:14.375111Z", "loop": 722, "env_steps": 444211199, "loss": 0.01672741398215294, "avg_return": 0.3131084144115448, "regret": 0.4923170506954193, "entropy": 0.6948531270027161, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:15.533798Z", "loop": 723, "env_steps": 444825599, "loss": 0.0152378398925066, "avg_return": 0.3114905059337616, "regret": 0.4923170506954193, "entropy": 0.6949166059494019, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:16.693931Z", "loop": 724, "env_steps": 445439999, "loss": 0.016566965728998184, "avg_return": 0.3093677759170532, "regret": 0.4923170506954193, "entropy": 0.694875180721283, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:17.899021Z", "loop": 725, "env_steps": 446054399, "loss": 0.01633148454129696, "avg_return": 0.31479352712631226, "regret": 0.49209463596343994, "entropy": 0.6949206590652466, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:19.059801Z", "loop": 726, "env_steps": 446668799, "loss": 0.016120191663503647, "avg_return": 0.31249696016311646, "regret": 0.49209463596343994, "entropy": 0.6949594020843506, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:20.218825Z", "loop": 727, "env_steps": 447283199, "loss": 0.016983235254883766, "avg_return": 0.314959317445755, "regret": 0.49209463596343994, "entropy": 0.6949776411056519, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:21.381055Z", "loop": 728, "env_steps": 447897599, "loss": 0.016999829560518265, "avg_return": 0.31342676281929016, "regret": 0.49209463596343994, "entropy": 0.6946931481361389, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:22.541951Z", "loop": 729, "env_steps": 448511999, "loss": 0.0171463992446661, "avg_return": 0.3177228271961212, "regret": 0.49209463596343994, "entropy": 0.6945810317993164, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:23.746629Z", "loop": 730, "env_steps": 449126399, "loss": 0.01730036549270153, "avg_return": 0.3084650933742523, "regret": 0.4921662211418152, "entropy": 0.6943994164466858, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:24.907264Z", "loop": 731, "env_steps": 449740799, "loss": 0.017603321000933647, "avg_return": 0.31580987572669983, "regret": 0.4921662211418152, "entropy": 0.6940357685089111, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:26.066683Z", "loop": 732, "env_steps": 450355199, "loss": 0.016704393550753593, "avg_return": 0.3097800314426422, "regret": 0.4921662211418152, "entropy": 0.6935091614723206, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:27.231654Z", "loop": 733, "env_steps": 450969599, "loss": 0.01590096950531006, "avg_return": 0.31273624300956726, "regret": 0.4921662211418152, "entropy": 0.6933503746986389, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:28.392573Z", "loop": 734, "env_steps": 451583999, "loss": 0.016827978193759918, "avg_return": 0.312333881855011, "regret": 0.4921662211418152, "entropy": 0.693885326385498, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:29.597848Z", "loop": 735, "env_steps": 452198399, "loss": 0.017379334196448326, "avg_return": 0.31296414136886597, "regret": 0.492105096578598, "entropy": 0.6943785548210144, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:30.758396Z", "loop": 736, "env_steps": 452812799, "loss": 0.016948824748396873, "avg_return": 0.3093113899230957, "regret": 0.492105096578598, "entropy": 0.6947383880615234, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:31.917647Z", "loop": 737, "env_steps": 453427199, "loss": 0.016662191599607468, "avg_return": 0.31555044651031494, "regret": 0.492105096578598, "entropy": 0.6948235034942627, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:33.077550Z", "loop": 738, "env_steps": 454041599, "loss": 0.016649991273880005, "avg_return": 0.31038007140159607, "regret": 0.492105096578598, "entropy": 0.6947324275970459, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:34.236840Z", "loop": 739, "env_steps": 454655999, "loss": 0.016841158270835876, "avg_return": 0.314098060131073, "regret": 0.492105096578598, "entropy": 0.6946574449539185, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:35.438902Z", "loop": 740, "env_steps": 455270399, "loss": 0.01661035232245922, "avg_return": 0.3062649667263031, "regret": 0.4920101761817932, "entropy": 0.6947276592254639, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:36.598441Z", "loop": 741, "env_steps": 455884799, "loss": 0.016635915264487267, "avg_return": 0.31631195545196533, "regret": 0.4920101761817932, "entropy": 0.6947635412216187, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:37.759075Z", "loop": 742, "env_steps": 456499199, "loss": 0.017604930326342583, "avg_return": 0.31015896797180176, "regret": 0.4920101761817932, "entropy": 0.6947801113128662, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:38.918392Z", "loop": 743, "env_steps": 457113599, "loss": 0.015850355848670006, "avg_return": 0.311214804649353, "regret": 0.4920101761817932, "entropy": 0.6946998834609985, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:40.078357Z", "loop": 744, "env_steps": 457727999, "loss": 0.016804883256554604, "avg_return": 0.30435436964035034, "regret": 0.4920101761817932, "entropy": 0.6946775913238525, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:41.278925Z", "loop": 745, "env_steps": 458342399, "loss": 0.016973210498690605, "avg_return": 0.30833083391189575, "regret": 0.4919651746749878, "entropy": 0.6947042346000671, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:42.440055Z", "loop": 746, "env_steps": 458956799, "loss": 0.015139803290367126, "avg_return": 0.308210164308548, "regret": 0.4919651746749878, "entropy": 0.6946064233779907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:43.599832Z", "loop": 747, "env_steps": 459571199, "loss": 0.016609255224466324, "avg_return": 0.3119755983352661, "regret": 0.4919651746749878, "entropy": 0.6943556666374207, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:44.760695Z", "loop": 748, "env_steps": 460185599, "loss": 0.016133414581418037, "avg_return": 0.31751400232315063, "regret": 0.4919651746749878, "entropy": 0.6942600607872009, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:45.919886Z", "loop": 749, "env_steps": 460799999, "loss": 0.016814453527331352, "avg_return": 0.31118321418762207, "regret": 0.4919651746749878, "entropy": 0.6942915320396423, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:47.123130Z", "loop": 750, "env_steps": 461414399, "loss": 0.016836337745189667, "avg_return": 0.31265532970428467, "regret": 0.4919790029525757, "entropy": 0.6945514678955078, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:48.285105Z", "loop": 751, "env_steps": 462028799, "loss": 0.015467165969312191, "avg_return": 0.3082144856452942, "regret": 0.4919790029525757, "entropy": 0.6948472261428833, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:49.446259Z", "loop": 752, "env_steps": 462643199, "loss": 0.01639731042087078, "avg_return": 0.31394922733306885, "regret": 0.4919790029525757, "entropy": 0.6948509216308594, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:50.607031Z", "loop": 753, "env_steps": 463257599, "loss": 0.01579432003200054, "avg_return": 0.3127722442150116, "regret": 0.4919790029525757, "entropy": 0.6948266625404358, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:51.767555Z", "loop": 754, "env_steps": 463871999, "loss": 0.015998123213648796, "avg_return": 0.30721649527549744, "regret": 0.4919790029525757, "entropy": 0.6948487758636475, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:52.971057Z", "loop": 755, "env_steps": 464486399, "loss": 0.01584770902991295, "avg_return": 0.31293803453445435, "regret": 0.49191465973854065, "entropy": 0.6948819756507874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:54.131589Z", "loop": 756, "env_steps": 465100799, "loss": 0.016781121492385864, "avg_return": 0.3152047395706177, "regret": 0.49191465973854065, "entropy": 0.6948747634887695, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:55.290463Z", "loop": 757, "env_steps": 465715199, "loss": 0.01828400045633316, "avg_return": 0.3134053945541382, "regret": 0.49191465973854065, "entropy": 0.6944997310638428, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:56.450221Z", "loop": 758, "env_steps": 466329599, "loss": 0.017177680507302284, "avg_return": 0.3133920729160309, "regret": 0.49191465973854065, "entropy": 0.6943269371986389, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:57.608821Z", "loop": 759, "env_steps": 466943999, "loss": 0.015715455636382103, "avg_return": 0.31193339824676514, "regret": 0.49191465973854065, "entropy": 0.6946757435798645, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:58.809873Z", "loop": 760, "env_steps": 467558399, "loss": 0.016184110194444656, "avg_return": 0.3103611469268799, "regret": 0.49188899993896484, "entropy": 0.6949856281280518, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:40:59.969485Z", "loop": 761, "env_steps": 468172799, "loss": 0.015560165047645569, "avg_return": 0.3045417368412018, "regret": 0.49188899993896484, "entropy": 0.6949797868728638, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:01.128979Z", "loop": 762, "env_steps": 468787199, "loss": 0.016968606039881706, "avg_return": 0.3160179853439331, "regret": 0.49188899993896484, "entropy": 0.6945677995681763, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:02.288829Z", "loop": 763, "env_steps": 469401599, "loss": 0.0169464610517025, "avg_return": 0.3106572926044464, "regret": 0.49188899993896484, "entropy": 0.6939247250556946, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:03.448949Z", "loop": 764, "env_steps": 470015999, "loss": 0.016748448833823204, "avg_return": 0.30619341135025024, "regret": 0.49188899993896484, "entropy": 0.6934464573860168, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:04.650171Z", "loop": 765, "env_steps": 470630399, "loss": 0.01652577705681324, "avg_return": 0.3101612627506256, "regret": 0.4922119975090027, "entropy": 0.6934736967086792, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:05.810807Z", "loop": 766, "env_steps": 471244799, "loss": 0.016034895554184914, "avg_return": 0.31052136421203613, "regret": 0.4922119975090027, "entropy": 0.6940174698829651, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:06.970480Z", "loop": 767, "env_steps": 471859199, "loss": 0.016313819214701653, "avg_return": 0.308871328830719, "regret": 0.4922119975090027, "entropy": 0.6946918964385986, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:08.131196Z", "loop": 768, "env_steps": 472473599, "loss": 0.01664065197110176, "avg_return": 0.31101787090301514, "regret": 0.4922119975090027, "entropy": 0.6948716640472412, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:09.291234Z", "loop": 769, "env_steps": 473087999, "loss": 0.016621777787804604, "avg_return": 0.3097572922706604, "regret": 0.4922119975090027, "entropy": 0.6947149634361267, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:10.492971Z", "loop": 770, "env_steps": 473702399, "loss": 0.018072981387376785, "avg_return": 0.3183536231517792, "regret": 0.4919634759426117, "entropy": 0.6943662762641907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:11.656702Z", "loop": 771, "env_steps": 474316799, "loss": 0.01634824648499489, "avg_return": 0.3121441602706909, "regret": 0.4919634759426117, "entropy": 0.6940414309501648, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:12.816678Z", "loop": 772, "env_steps": 474931199, "loss": 0.01843874715268612, "avg_return": 0.31676483154296875, "regret": 0.4919634759426117, "entropy": 0.6935520768165588, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:13.976803Z", "loop": 773, "env_steps": 475545599, "loss": 0.015501393936574459, "avg_return": 0.3126826584339142, "regret": 0.4919634759426117, "entropy": 0.6936936378479004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:15.138767Z", "loop": 774, "env_steps": 476159999, "loss": 0.017903588712215424, "avg_return": 0.31611043214797974, "regret": 0.4919634759426117, "entropy": 0.6943222284317017, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:16.353736Z", "loop": 775, "env_steps": 476774399, "loss": 0.015748128294944763, "avg_return": 0.3167897164821625, "regret": 0.49178266525268555, "entropy": 0.6947193741798401, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:17.516041Z", "loop": 776, "env_steps": 477388799, "loss": 0.017628371715545654, "avg_return": 0.31535834074020386, "regret": 0.49178266525268555, "entropy": 0.6947274804115295, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:18.683574Z", "loop": 777, "env_steps": 478003199, "loss": 0.016017071902751923, "avg_return": 0.3138295114040375, "regret": 0.49178266525268555, "entropy": 0.6943901777267456, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:19.846997Z", "loop": 778, "env_steps": 478617599, "loss": 0.016934067010879517, "avg_return": 0.31547611951828003, "regret": 0.49178266525268555, "entropy": 0.6941578388214111, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:21.008039Z", "loop": 779, "env_steps": 479231999, "loss": 0.017682893201708794, "avg_return": 0.30795684456825256, "regret": 0.49178266525268555, "entropy": 0.6941711902618408, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:22.214313Z", "loop": 780, "env_steps": 479846399, "loss": 0.016447003930807114, "avg_return": 0.3083212077617645, "regret": 0.49193525314331055, "entropy": 0.6937907934188843, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:23.379880Z", "loop": 781, "env_steps": 480460799, "loss": 0.01665426604449749, "avg_return": 0.31304535269737244, "regret": 0.49193525314331055, "entropy": 0.6933289170265198, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:24.541876Z", "loop": 782, "env_steps": 481075199, "loss": 0.016655772924423218, "avg_return": 0.3121177852153778, "regret": 0.49193525314331055, "entropy": 0.6933740377426147, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:25.701824Z", "loop": 783, "env_steps": 481689599, "loss": 0.017043322324752808, "avg_return": 0.31525540351867676, "regret": 0.49193525314331055, "entropy": 0.6938663125038147, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:26.863916Z", "loop": 784, "env_steps": 482303999, "loss": 0.017747534438967705, "avg_return": 0.3167009949684143, "regret": 0.49193525314331055, "entropy": 0.6943760514259338, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:28.069424Z", "loop": 785, "env_steps": 482918399, "loss": 0.01663670502603054, "avg_return": 0.3158207833766937, "regret": 0.4917013943195343, "entropy": 0.6945016384124756, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:29.234436Z", "loop": 786, "env_steps": 483532799, "loss": 0.016795534640550613, "avg_return": 0.30998849868774414, "regret": 0.4917013943195343, "entropy": 0.694534957408905, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:30.393385Z", "loop": 787, "env_steps": 484147199, "loss": 0.015761379152536392, "avg_return": 0.3100724220275879, "regret": 0.4917013943195343, "entropy": 0.6946300268173218, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:31.553856Z", "loop": 788, "env_steps": 484761599, "loss": 0.01860818639397621, "avg_return": 0.31634655594825745, "regret": 0.4917013943195343, "entropy": 0.6946388483047485, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:32.712962Z", "loop": 789, "env_steps": 485375999, "loss": 0.016443291679024696, "avg_return": 0.31224530935287476, "regret": 0.4917013943195343, "entropy": 0.6946476101875305, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:33.924266Z", "loop": 790, "env_steps": 485990399, "loss": 0.016444506123661995, "avg_return": 0.3045143783092499, "regret": 0.4916314482688904, "entropy": 0.6946486234664917, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:35.086523Z", "loop": 791, "env_steps": 486604799, "loss": 0.01578342728316784, "avg_return": 0.30872228741645813, "regret": 0.4916314482688904, "entropy": 0.6945765614509583, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:36.248205Z", "loop": 792, "env_steps": 487219199, "loss": 0.0159351397305727, "avg_return": 0.3099408745765686, "regret": 0.4916314482688904, "entropy": 0.6946068406105042, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:37.409514Z", "loop": 793, "env_steps": 487833599, "loss": 0.016843309625983238, "avg_return": 0.3122778534889221, "regret": 0.4916314482688904, "entropy": 0.6947231888771057, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:38.570800Z", "loop": 794, "env_steps": 488447999, "loss": 0.016099266707897186, "avg_return": 0.31247246265411377, "regret": 0.4916314482688904, "entropy": 0.6947442293167114, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:39.776470Z", "loop": 795, "env_steps": 489062399, "loss": 0.016238383948802948, "avg_return": 0.3128757178783417, "regret": 0.4915851056575775, "entropy": 0.6947243213653564, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:40.936964Z", "loop": 796, "env_steps": 489676799, "loss": 0.016149329021573067, "avg_return": 0.31334757804870605, "regret": 0.4915851056575775, "entropy": 0.6946440935134888, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:42.096057Z", "loop": 797, "env_steps": 490291199, "loss": 0.0167236290872097, "avg_return": 0.31228795647621155, "regret": 0.4915851056575775, "entropy": 0.6946737170219421, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:43.255840Z", "loop": 798, "env_steps": 490905599, "loss": 0.016722621396183968, "avg_return": 0.31759852170944214, "regret": 0.4915851056575775, "entropy": 0.694753110408783, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:44.415473Z", "loop": 799, "env_steps": 491519999, "loss": 0.01640348508954048, "avg_return": 0.3063942492008209, "regret": 0.4915851056575775, "entropy": 0.6946994066238403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:45.618365Z", "loop": 800, "env_steps": 492134399, "loss": 0.016309494152665138, "avg_return": 0.3090183734893799, "regret": 0.49158045649528503, "entropy": 0.6946159601211548, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:46.778848Z", "loop": 801, "env_steps": 492748799, "loss": 0.016860555857419968, "avg_return": 0.3087974488735199, "regret": 0.49158045649528503, "entropy": 0.6946254372596741, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:47.939388Z", "loop": 802, "env_steps": 493363199, "loss": 0.015920836478471756, "avg_return": 0.3149920701980591, "regret": 0.49158045649528503, "entropy": 0.6947160959243774, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:49.097816Z", "loop": 803, "env_steps": 493977599, "loss": 0.015839923173189163, "avg_return": 0.3119216561317444, "regret": 0.49158045649528503, "entropy": 0.6947886347770691, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:50.257805Z", "loop": 804, "env_steps": 494591999, "loss": 0.015902919694781303, "avg_return": 0.3143095374107361, "regret": 0.49158045649528503, "entropy": 0.6947823166847229, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:51.458663Z", "loop": 805, "env_steps": 495206399, "loss": 0.016385627910494804, "avg_return": 0.31293076276779175, "regret": 0.49143117666244507, "entropy": 0.694748044013977, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:52.619278Z", "loop": 806, "env_steps": 495820799, "loss": 0.016025489196181297, "avg_return": 0.30420374870300293, "regret": 0.49143117666244507, "entropy": 0.6947145462036133, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:53.781581Z", "loop": 807, "env_steps": 496435199, "loss": 0.016239486634731293, "avg_return": 0.3133644461631775, "regret": 0.49143117666244507, "entropy": 0.6946046352386475, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:54.940873Z", "loop": 808, "env_steps": 497049599, "loss": 0.016744213178753853, "avg_return": 0.3087112009525299, "regret": 0.49143117666244507, "entropy": 0.6945458054542542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:56.102898Z", "loop": 809, "env_steps": 497663999, "loss": 0.015787942335009575, "avg_return": 0.3096415400505066, "regret": 0.49143117666244507, "entropy": 0.6944446563720703, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:57.307462Z", "loop": 810, "env_steps": 498278399, "loss": 0.016475027427077293, "avg_return": 0.31438079476356506, "regret": 0.4914771318435669, "entropy": 0.6942739486694336, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:58.466679Z", "loop": 811, "env_steps": 498892799, "loss": 0.015994776040315628, "avg_return": 0.31333762407302856, "regret": 0.4914771318435669, "entropy": 0.694077730178833, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:41:59.627690Z", "loop": 812, "env_steps": 499507199, "loss": 0.01744040660560131, "avg_return": 0.31886565685272217, "regret": 0.4914771318435669, "entropy": 0.6943110227584839, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:00.787292Z", "loop": 813, "env_steps": 500121599, "loss": 0.017468256875872612, "avg_return": 0.3115675449371338, "regret": 0.4914771318435669, "entropy": 0.6944141983985901, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:01.946656Z", "loop": 814, "env_steps": 500735999, "loss": 0.017085285857319832, "avg_return": 0.31006282567977905, "regret": 0.4914771318435669, "entropy": 0.6944929957389832, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:03.152503Z", "loop": 815, "env_steps": 501350399, "loss": 0.015618576668202877, "avg_return": 0.3120822012424469, "regret": 0.49142423272132874, "entropy": 0.6938799023628235, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:04.313861Z", "loop": 816, "env_steps": 501964799, "loss": 0.016343673691153526, "avg_return": 0.31302013993263245, "regret": 0.49142423272132874, "entropy": 0.6924827694892883, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:05.473403Z", "loop": 817, "env_steps": 502579199, "loss": 0.016209058463573456, "avg_return": 0.3110424876213074, "regret": 0.49142423272132874, "entropy": 0.6912261247634888, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:06.634534Z", "loop": 818, "env_steps": 503193599, "loss": 0.016596348956227303, "avg_return": 0.3161396384239197, "regret": 0.49142423272132874, "entropy": 0.6903977394104004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:07.793988Z", "loop": 819, "env_steps": 503807999, "loss": 0.016293926164507866, "avg_return": 0.30917760729789734, "regret": 0.49142423272132874, "entropy": 0.6894811391830444, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:08.996823Z", "loop": 820, "env_steps": 504422399, "loss": 0.015123516321182251, "avg_return": 0.31017276644706726, "regret": 0.4922562539577484, "entropy": 0.6906020641326904, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:10.157503Z", "loop": 821, "env_steps": 505036799, "loss": 0.01598222367465496, "avg_return": 0.3165648877620697, "regret": 0.4922562539577484, "entropy": 0.6915189623832703, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:11.318111Z", "loop": 822, "env_steps": 505651199, "loss": 0.016375483945012093, "avg_return": 0.31241583824157715, "regret": 0.4922562539577484, "entropy": 0.6921555995941162, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:12.480683Z", "loop": 823, "env_steps": 506265599, "loss": 0.01723499409854412, "avg_return": 0.3135128617286682, "regret": 0.4922562539577484, "entropy": 0.6929327249526978, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:13.639874Z", "loop": 824, "env_steps": 506879999, "loss": 0.016030361875891685, "avg_return": 0.31099840998649597, "regret": 0.4922562539577484, "entropy": 0.6932437419891357, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:14.841754Z", "loop": 825, "env_steps": 507494399, "loss": 0.0150365075096488, "avg_return": 0.31206563115119934, "regret": 0.49138039350509644, "entropy": 0.693284809589386, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:16.002407Z", "loop": 826, "env_steps": 508108799, "loss": 0.016164902597665787, "avg_return": 0.3109848201274872, "regret": 0.49138039350509644, "entropy": 0.6938109397888184, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:17.165512Z", "loop": 827, "env_steps": 508723199, "loss": 0.017171353101730347, "avg_return": 0.3135826587677002, "regret": 0.49138039350509644, "entropy": 0.6944253444671631, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:18.325728Z", "loop": 828, "env_steps": 509337599, "loss": 0.017312468960881233, "avg_return": 0.31371966004371643, "regret": 0.49138039350509644, "entropy": 0.6939816474914551, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:19.484743Z", "loop": 829, "env_steps": 509951999, "loss": 0.016882045194506645, "avg_return": 0.3053002953529358, "regret": 0.49138039350509644, "entropy": 0.692371666431427, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:20.688041Z", "loop": 830, "env_steps": 510566399, "loss": 0.016186479479074478, "avg_return": 0.3135989308357239, "regret": 0.49238044023513794, "entropy": 0.6904885768890381, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:21.850598Z", "loop": 831, "env_steps": 511180799, "loss": 0.016434621065855026, "avg_return": 0.31027382612228394, "regret": 0.49238044023513794, "entropy": 0.6895027756690979, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:23.016911Z", "loop": 832, "env_steps": 511795199, "loss": 0.0157935731112957, "avg_return": 0.3096449673175812, "regret": 0.49238044023513794, "entropy": 0.6913055777549744, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:24.177476Z", "loop": 833, "env_steps": 512409599, "loss": 0.017275312915444374, "avg_return": 0.3146820068359375, "regret": 0.49238044023513794, "entropy": 0.6928282976150513, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:25.336972Z", "loop": 834, "env_steps": 513023999, "loss": 0.015929849818348885, "avg_return": 0.3085876405239105, "regret": 0.49238044023513794, "entropy": 0.6940309405326843, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:26.544589Z", "loop": 835, "env_steps": 513638399, "loss": 0.016062531620264053, "avg_return": 0.31608134508132935, "regret": 0.49089258909225464, "entropy": 0.6943368911743164, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:27.705182Z", "loop": 836, "env_steps": 514252799, "loss": 0.017771074548363686, "avg_return": 0.31711050868034363, "regret": 0.49089258909225464, "entropy": 0.6937460899353027, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:28.866257Z", "loop": 837, "env_steps": 514867199, "loss": 0.015380344353616238, "avg_return": 0.30772146582603455, "regret": 0.49089258909225464, "entropy": 0.692218005657196, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:30.025886Z", "loop": 838, "env_steps": 515481599, "loss": 0.015243072994053364, "avg_return": 0.31000223755836487, "regret": 0.49089258909225464, "entropy": 0.6913160681724548, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:31.185825Z", "loop": 839, "env_steps": 516095999, "loss": 0.01608223281800747, "avg_return": 0.308373361825943, "regret": 0.49089258909225464, "entropy": 0.6910849809646606, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:32.386675Z", "loop": 840, "env_steps": 516710399, "loss": 0.017313947901129723, "avg_return": 0.3128085732460022, "regret": 0.49147820472717285, "entropy": 0.6916135549545288, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:33.547267Z", "loop": 841, "env_steps": 517324799, "loss": 0.01636415533721447, "avg_return": 0.3131389021873474, "regret": 0.49147820472717285, "entropy": 0.6923917531967163, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:34.706188Z", "loop": 842, "env_steps": 517939199, "loss": 0.01624622754752636, "avg_return": 0.31508105993270874, "regret": 0.49147820472717285, "entropy": 0.6936361789703369, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:35.867329Z", "loop": 843, "env_steps": 518553599, "loss": 0.015195230022072792, "avg_return": 0.3094850778579712, "regret": 0.49147820472717285, "entropy": 0.6941941976547241, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:37.027551Z", "loop": 844, "env_steps": 519167999, "loss": 0.01631977967917919, "avg_return": 0.30732524394989014, "regret": 0.49147820472717285, "entropy": 0.6941080689430237, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:38.231544Z", "loop": 845, "env_steps": 519782399, "loss": 0.016817759722471237, "avg_return": 0.3152097761631012, "regret": 0.49078017473220825, "entropy": 0.6939122676849365, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:39.392922Z", "loop": 846, "env_steps": 520396799, "loss": 0.01630990579724312, "avg_return": 0.3179946839809418, "regret": 0.49078017473220825, "entropy": 0.6934516429901123, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:40.554515Z", "loop": 847, "env_steps": 521011199, "loss": 0.016741013154387474, "avg_return": 0.31593552231788635, "regret": 0.49078017473220825, "entropy": 0.6921366453170776, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:41.714449Z", "loop": 848, "env_steps": 521625599, "loss": 0.0160395298153162, "avg_return": 0.3061154782772064, "regret": 0.49078017473220825, "entropy": 0.6910766959190369, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:42.874540Z", "loop": 849, "env_steps": 522239999, "loss": 0.01628720760345459, "avg_return": 0.3102532923221588, "regret": 0.49078017473220825, "entropy": 0.6897176504135132, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:44.075067Z", "loop": 850, "env_steps": 522854399, "loss": 0.015699544921517372, "avg_return": 0.31286463141441345, "regret": 0.49176132678985596, "entropy": 0.6902530789375305, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:45.236540Z", "loop": 851, "env_steps": 523468799, "loss": 0.016030428931117058, "avg_return": 0.3153018653392792, "regret": 0.49176132678985596, "entropy": 0.6920755505561829, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:46.395951Z", "loop": 852, "env_steps": 524083199, "loss": 0.017284629866480827, "avg_return": 0.31485575437545776, "regret": 0.49176132678985596, "entropy": 0.6937148571014404, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:47.556081Z", "loop": 853, "env_steps": 524697599, "loss": 0.01524113304913044, "avg_return": 0.3145616352558136, "regret": 0.49176132678985596, "entropy": 0.6938437223434448, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:48.715261Z", "loop": 854, "env_steps": 525311999, "loss": 0.01620936580002308, "avg_return": 0.31571823358535767, "regret": 0.49176132678985596, "entropy": 0.6911899447441101, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:49.916291Z", "loop": 855, "env_steps": 525926399, "loss": 0.0163596011698246, "avg_return": 0.31281590461730957, "regret": 0.4916321933269501, "entropy": 0.689637303352356, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:51.077002Z", "loop": 856, "env_steps": 526540799, "loss": 0.015770524740219116, "avg_return": 0.3115922808647156, "regret": 0.4916321933269501, "entropy": 0.6888439059257507, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:52.238522Z", "loop": 857, "env_steps": 527155199, "loss": 0.015830157324671745, "avg_return": 0.3110295832157135, "regret": 0.4916321933269501, "entropy": 0.690123975276947, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:53.398369Z", "loop": 858, "env_steps": 527769599, "loss": 0.015788255259394646, "avg_return": 0.3150944709777832, "regret": 0.4916321933269501, "entropy": 0.6927652359008789, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:54.558544Z", "loop": 859, "env_steps": 528383999, "loss": 0.01600843481719494, "avg_return": 0.3128862679004669, "regret": 0.4916321933269501, "entropy": 0.6941803097724915, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:55.761255Z", "loop": 860, "env_steps": 528998399, "loss": 0.016377871856093407, "avg_return": 0.3121110498905182, "regret": 0.49038925766944885, "entropy": 0.6939855217933655, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:56.923230Z", "loop": 861, "env_steps": 529612799, "loss": 0.016947263851761818, "avg_return": 0.31665539741516113, "regret": 0.49038925766944885, "entropy": 0.6932814121246338, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:58.083268Z", "loop": 862, "env_steps": 530227199, "loss": 0.017040608450770378, "avg_return": 0.31409209966659546, "regret": 0.49038925766944885, "entropy": 0.6926652193069458, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:42:59.246498Z", "loop": 863, "env_steps": 530841599, "loss": 0.014875384047627449, "avg_return": 0.31087276339530945, "regret": 0.49038925766944885, "entropy": 0.6919164657592773, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:00.407830Z", "loop": 864, "env_steps": 531455999, "loss": 0.015078931115567684, "avg_return": 0.31264200806617737, "regret": 0.49038925766944885, "entropy": 0.6920180320739746, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:01.609884Z", "loop": 865, "env_steps": 532070399, "loss": 0.016346191987395287, "avg_return": 0.30926087498664856, "regret": 0.490709125995636, "entropy": 0.6926802396774292, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:02.773709Z", "loop": 866, "env_steps": 532684799, "loss": 0.015073493123054504, "avg_return": 0.31012314558029175, "regret": 0.490709125995636, "entropy": 0.6937218308448792, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:03.936166Z", "loop": 867, "env_steps": 533299199, "loss": 0.016852226108312607, "avg_return": 0.31526419520378113, "regret": 0.490709125995636, "entropy": 0.6942301988601685, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:05.097152Z", "loop": 868, "env_steps": 533913599, "loss": 0.015932170674204826, "avg_return": 0.3113660216331482, "regret": 0.490709125995636, "entropy": 0.6942426562309265, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:06.257536Z", "loop": 869, "env_steps": 534527999, "loss": 0.0158530380576849, "avg_return": 0.31376251578330994, "regret": 0.490709125995636, "entropy": 0.6940949559211731, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:07.463897Z", "loop": 870, "env_steps": 535142399, "loss": 0.01620502769947052, "avg_return": 0.30859026312828064, "regret": 0.4900114834308624, "entropy": 0.6939771175384521, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:08.626626Z", "loop": 871, "env_steps": 535756799, "loss": 0.016312843188643456, "avg_return": 0.315432608127594, "regret": 0.4900114834308624, "entropy": 0.6939569711685181, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:09.787493Z", "loop": 872, "env_steps": 536371199, "loss": 0.015036122873425484, "avg_return": 0.30920788645744324, "regret": 0.4900114834308624, "entropy": 0.6940205097198486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:10.948617Z", "loop": 873, "env_steps": 536985599, "loss": 0.01705658808350563, "avg_return": 0.3178648054599762, "regret": 0.4900114834308624, "entropy": 0.6940872669219971, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:12.110797Z", "loop": 874, "env_steps": 537599999, "loss": 0.015930427238345146, "avg_return": 0.3192102015018463, "regret": 0.4900114834308624, "entropy": 0.6941269636154175, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:13.315974Z", "loop": 875, "env_steps": 538214399, "loss": 0.016674788668751717, "avg_return": 0.3120782971382141, "regret": 0.4897271692752838, "entropy": 0.6940807104110718, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:14.477153Z", "loop": 876, "env_steps": 538828799, "loss": 0.01695147715508938, "avg_return": 0.3165324926376343, "regret": 0.4897271692752838, "entropy": 0.6939736008644104, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:15.638554Z", "loop": 877, "env_steps": 539443199, "loss": 0.016130497679114342, "avg_return": 0.3133483827114105, "regret": 0.4897271692752838, "entropy": 0.6939441561698914, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:16.800297Z", "loop": 878, "env_steps": 540057599, "loss": 0.015778671950101852, "avg_return": 0.3136484920978546, "regret": 0.4897271692752838, "entropy": 0.6939307451248169, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:17.961422Z", "loop": 879, "env_steps": 540671999, "loss": 0.01561195682734251, "avg_return": 0.3135592043399811, "regret": 0.4897271692752838, "entropy": 0.6939326524734497, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:19.174011Z", "loop": 880, "env_steps": 541286399, "loss": 0.016423344612121582, "avg_return": 0.3196044862270355, "regret": 0.4894571006298065, "entropy": 0.693801760673523, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:20.332565Z", "loop": 881, "env_steps": 541900799, "loss": 0.01654745265841484, "avg_return": 0.31861868500709534, "regret": 0.4894571006298065, "entropy": 0.6935743689537048, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:21.492953Z", "loop": 882, "env_steps": 542515199, "loss": 0.016107523813843727, "avg_return": 0.31266191601753235, "regret": 0.4894571006298065, "entropy": 0.693317174911499, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:22.651731Z", "loop": 883, "env_steps": 543129599, "loss": 0.01634187065064907, "avg_return": 0.314209520816803, "regret": 0.4894571006298065, "entropy": 0.6928895115852356, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:23.810993Z", "loop": 884, "env_steps": 543743999, "loss": 0.01601947844028473, "avg_return": 0.31140029430389404, "regret": 0.4894571006298065, "entropy": 0.6930175423622131, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:25.011598Z", "loop": 885, "env_steps": 544358399, "loss": 0.01592082343995571, "avg_return": 0.3183549642562866, "regret": 0.4893028736114502, "entropy": 0.692997395992279, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:26.173306Z", "loop": 886, "env_steps": 544972799, "loss": 0.01597627066075802, "avg_return": 0.31040260195732117, "regret": 0.4893028736114502, "entropy": 0.6930220723152161, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:27.333299Z", "loop": 887, "env_steps": 545587199, "loss": 0.015944773331284523, "avg_return": 0.3106345534324646, "regret": 0.4893028736114502, "entropy": 0.6934833526611328, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:28.494393Z", "loop": 888, "env_steps": 546201599, "loss": 0.014955609105527401, "avg_return": 0.3082420825958252, "regret": 0.4893028736114502, "entropy": 0.693499743938446, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:29.654714Z", "loop": 889, "env_steps": 546815999, "loss": 0.01570359244942665, "avg_return": 0.3049461543560028, "regret": 0.4893028736114502, "entropy": 0.6926839351654053, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:30.858414Z", "loop": 890, "env_steps": 547430399, "loss": 0.01720026321709156, "avg_return": 0.3232713043689728, "regret": 0.4894722104072571, "entropy": 0.6914527416229248, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:32.021156Z", "loop": 891, "env_steps": 548044799, "loss": 0.015109335072338581, "avg_return": 0.3137451708316803, "regret": 0.4894722104072571, "entropy": 0.6903359293937683, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:33.180790Z", "loop": 892, "env_steps": 548659199, "loss": 0.017253076657652855, "avg_return": 0.3104681968688965, "regret": 0.4894722104072571, "entropy": 0.6903859972953796, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:34.339839Z", "loop": 893, "env_steps": 549273599, "loss": 0.015597062185406685, "avg_return": 0.3097439110279083, "regret": 0.4894722104072571, "entropy": 0.6919751167297363, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:35.501726Z", "loop": 894, "env_steps": 549887999, "loss": 0.016105487942695618, "avg_return": 0.3174596130847931, "regret": 0.4894722104072571, "entropy": 0.6928588151931763, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:36.707521Z", "loop": 895, "env_steps": 550502399, "loss": 0.016390115022659302, "avg_return": 0.3121413290500641, "regret": 0.4884205758571625, "entropy": 0.6929414868354797, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:37.867625Z", "loop": 896, "env_steps": 551116799, "loss": 0.015670130029320717, "avg_return": 0.31383320689201355, "regret": 0.4884205758571625, "entropy": 0.6919170022010803, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:39.027025Z", "loop": 897, "env_steps": 551731199, "loss": 0.016322743147611618, "avg_return": 0.3175717294216156, "regret": 0.4884205758571625, "entropy": 0.6905830502510071, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:40.186696Z", "loop": 898, "env_steps": 552345599, "loss": 0.016264090314507484, "avg_return": 0.3193129301071167, "regret": 0.4884205758571625, "entropy": 0.6895902156829834, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:41.346351Z", "loop": 899, "env_steps": 552959999, "loss": 0.015219743363559246, "avg_return": 0.3159011900424957, "regret": 0.4884205758571625, "entropy": 0.6913615465164185, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:42.549145Z", "loop": 900, "env_steps": 553574399, "loss": 0.015752596780657768, "avg_return": 0.3231858015060425, "regret": 0.4880785048007965, "entropy": 0.6923562288284302, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:43.709922Z", "loop": 901, "env_steps": 554188799, "loss": 0.016681494191288948, "avg_return": 0.3162074685096741, "regret": 0.4880785048007965, "entropy": 0.6924575567245483, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:44.869863Z", "loop": 902, "env_steps": 554803199, "loss": 0.017370324581861496, "avg_return": 0.3226473033428192, "regret": 0.4880785048007965, "entropy": 0.6905238032341003, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:46.029382Z", "loop": 903, "env_steps": 555417599, "loss": 0.01643242873251438, "avg_return": 0.31454962491989136, "regret": 0.4880785048007965, "entropy": 0.687949538230896, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:47.188836Z", "loop": 904, "env_steps": 556031999, "loss": 0.01644766889512539, "avg_return": 0.3114279508590698, "regret": 0.4880785048007965, "entropy": 0.6872161030769348, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:48.388044Z", "loop": 905, "env_steps": 556646399, "loss": 0.016240010038018227, "avg_return": 0.3234938085079193, "regret": 0.48855847120285034, "entropy": 0.6896389126777649, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:49.548738Z", "loop": 906, "env_steps": 557260799, "loss": 0.01544217485934496, "avg_return": 0.3172663450241089, "regret": 0.48855847120285034, "entropy": 0.691540539264679, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:50.708269Z", "loop": 907, "env_steps": 557875199, "loss": 0.016611209139227867, "avg_return": 0.3210599422454834, "regret": 0.48855847120285034, "entropy": 0.6921213269233704, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:51.875787Z", "loop": 908, "env_steps": 558489599, "loss": 0.01581726223230362, "avg_return": 0.3166959583759308, "regret": 0.48855847120285034, "entropy": 0.6922020316123962, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:53.034034Z", "loop": 909, "env_steps": 559103999, "loss": 0.016541574150323868, "avg_return": 0.32316672801971436, "regret": 0.48855847120285034, "entropy": 0.6919682025909424, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:54.236524Z", "loop": 910, "env_steps": 559718399, "loss": 0.015931006520986557, "avg_return": 0.3195798695087433, "regret": 0.4870508313179016, "entropy": 0.6918490529060364, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:55.397617Z", "loop": 911, "env_steps": 560332799, "loss": 0.016364512965083122, "avg_return": 0.3194372057914734, "regret": 0.4870508313179016, "entropy": 0.6916740536689758, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:56.556657Z", "loop": 912, "env_steps": 560947199, "loss": 0.01563110202550888, "avg_return": 0.3241613805294037, "regret": 0.4870508313179016, "entropy": 0.6919218301773071, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:57.715033Z", "loop": 913, "env_steps": 561561599, "loss": 0.016441458836197853, "avg_return": 0.3228374421596527, "regret": 0.4870508313179016, "entropy": 0.6919017434120178, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:43:58.875848Z", "loop": 914, "env_steps": 562175999, "loss": 0.016857974231243134, "avg_return": 0.3130461573600769, "regret": 0.4870508313179016, "entropy": 0.6916806697845459, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:00.079029Z", "loop": 915, "env_steps": 562790399, "loss": 0.01643732748925686, "avg_return": 0.3131776750087738, "regret": 0.4863830804824829, "entropy": 0.6915771961212158, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:01.239769Z", "loop": 916, "env_steps": 563404799, "loss": 0.015399808995425701, "avg_return": 0.3186134696006775, "regret": 0.4863830804824829, "entropy": 0.6914964318275452, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:02.399377Z", "loop": 917, "env_steps": 564019199, "loss": 0.015921154990792274, "avg_return": 0.31782591342926025, "regret": 0.4863830804824829, "entropy": 0.6914936304092407, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:03.558864Z", "loop": 918, "env_steps": 564633599, "loss": 0.014483054168522358, "avg_return": 0.3143954277038574, "regret": 0.4863830804824829, "entropy": 0.6912999153137207, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:04.718207Z", "loop": 919, "env_steps": 565247999, "loss": 0.016503119841217995, "avg_return": 0.3194996118545532, "regret": 0.4863830804824829, "entropy": 0.6905922889709473, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:05.920771Z", "loop": 920, "env_steps": 565862399, "loss": 0.015603169798851013, "avg_return": 0.3204997479915619, "regret": 0.4856160283088684, "entropy": 0.6905682682991028, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:07.081945Z", "loop": 921, "env_steps": 566476799, "loss": 0.015621915459632874, "avg_return": 0.3217044174671173, "regret": 0.4856160283088684, "entropy": 0.6904043555259705, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:08.243214Z", "loop": 922, "env_steps": 567091199, "loss": 0.016592904925346375, "avg_return": 0.3192152976989746, "regret": 0.4856160283088684, "entropy": 0.6902362704277039, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:09.403053Z", "loop": 923, "env_steps": 567705599, "loss": 0.01575685851275921, "avg_return": 0.3181220591068268, "regret": 0.4856160283088684, "entropy": 0.690585196018219, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:10.563569Z", "loop": 924, "env_steps": 568319999, "loss": 0.016600554808974266, "avg_return": 0.3162451386451721, "regret": 0.4856160283088684, "entropy": 0.6901724934577942, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:11.765534Z", "loop": 925, "env_steps": 568934399, "loss": 0.015639958903193474, "avg_return": 0.3142707049846649, "regret": 0.4846610724925995, "entropy": 0.6897192001342773, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:12.927901Z", "loop": 926, "env_steps": 569548799, "loss": 0.015779446810483932, "avg_return": 0.32035642862319946, "regret": 0.4846610724925995, "entropy": 0.68985915184021, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:14.087582Z", "loop": 927, "env_steps": 570163199, "loss": 0.015812687575817108, "avg_return": 0.3281114399433136, "regret": 0.4846610724925995, "entropy": 0.6887822151184082, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:15.249553Z", "loop": 928, "env_steps": 570777599, "loss": 0.01589936576783657, "avg_return": 0.3220447301864624, "regret": 0.4846610724925995, "entropy": 0.6863887906074524, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:16.409007Z", "loop": 929, "env_steps": 571391999, "loss": 0.016759900376200676, "avg_return": 0.3215019702911377, "regret": 0.4846610724925995, "entropy": 0.6846956014633179, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:17.621490Z", "loop": 930, "env_steps": 572006399, "loss": 0.015337000600993633, "avg_return": 0.32088953256607056, "regret": 0.4843156337738037, "entropy": 0.6838353872299194, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:18.782918Z", "loop": 931, "env_steps": 572620799, "loss": 0.01565869338810444, "avg_return": 0.3224954903125763, "regret": 0.4843156337738037, "entropy": 0.685683012008667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:19.943687Z", "loop": 932, "env_steps": 573235199, "loss": 0.014931345358490944, "avg_return": 0.3157500922679901, "regret": 0.4843156337738037, "entropy": 0.6869347095489502, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:21.103027Z", "loop": 933, "env_steps": 573849599, "loss": 0.015601572580635548, "avg_return": 0.3173973262310028, "regret": 0.4843156337738037, "entropy": 0.6877779960632324, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:22.262445Z", "loop": 934, "env_steps": 574463999, "loss": 0.014327301643788815, "avg_return": 0.31895220279693604, "regret": 0.4843156337738037, "entropy": 0.6863532066345215, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:23.468973Z", "loop": 935, "env_steps": 575078399, "loss": 0.01487811841070652, "avg_return": 0.3250593841075897, "regret": 0.4825998842716217, "entropy": 0.6849662065505981, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:24.629943Z", "loop": 936, "env_steps": 575692799, "loss": 0.015808258205652237, "avg_return": 0.3267747461795807, "regret": 0.4825998842716217, "entropy": 0.6844940781593323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:25.789336Z", "loop": 937, "env_steps": 576307199, "loss": 0.015424223616719246, "avg_return": 0.325652152299881, "regret": 0.4825998842716217, "entropy": 0.6844833493232727, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:26.948189Z", "loop": 938, "env_steps": 576921599, "loss": 0.01540250051766634, "avg_return": 0.3218385875225067, "regret": 0.4825998842716217, "entropy": 0.6846591234207153, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:28.109240Z", "loop": 939, "env_steps": 577535999, "loss": 0.014323070645332336, "avg_return": 0.3174492120742798, "regret": 0.4825998842716217, "entropy": 0.6851485967636108, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:29.312743Z", "loop": 940, "env_steps": 578150399, "loss": 0.01517259981483221, "avg_return": 0.3206583857536316, "regret": 0.48093682527542114, "entropy": 0.6812913417816162, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:30.472305Z", "loop": 941, "env_steps": 578764799, "loss": 0.01461103092879057, "avg_return": 0.3206724524497986, "regret": 0.48093682527542114, "entropy": 0.679838240146637, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:31.632628Z", "loop": 942, "env_steps": 579379199, "loss": 0.01469466369599104, "avg_return": 0.3291262090206146, "regret": 0.48093682527542114, "entropy": 0.6822360754013062, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:32.791872Z", "loop": 943, "env_steps": 579993599, "loss": 0.014313573017716408, "avg_return": 0.32459133863449097, "regret": 0.48093682527542114, "entropy": 0.6833717823028564, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:33.951984Z", "loop": 944, "env_steps": 580607999, "loss": 0.01399791520088911, "avg_return": 0.3270324766635895, "regret": 0.48093682527542114, "entropy": 0.6818158030509949, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:35.155352Z", "loop": 945, "env_steps": 581222399, "loss": 0.015972057357430458, "avg_return": 0.33029744029045105, "regret": 0.4785284698009491, "entropy": 0.6802836060523987, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:36.315278Z", "loop": 946, "env_steps": 581836799, "loss": 0.015966443344950676, "avg_return": 0.3280610144138336, "regret": 0.4785284698009491, "entropy": 0.6800982356071472, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:37.474013Z", "loop": 947, "env_steps": 582451199, "loss": 0.01424830686300993, "avg_return": 0.32420921325683594, "regret": 0.4785284698009491, "entropy": 0.6766945719718933, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:38.633882Z", "loop": 948, "env_steps": 583065599, "loss": 0.01491140853613615, "avg_return": 0.3266979157924652, "regret": 0.4785284698009491, "entropy": 0.6753756999969482, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:39.795158Z", "loop": 949, "env_steps": 583679999, "loss": 0.013356317766010761, "avg_return": 0.31670689582824707, "regret": 0.4785284698009491, "entropy": 0.6760948300361633, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:40.998731Z", "loop": 950, "env_steps": 584294399, "loss": 0.014392654411494732, "avg_return": 0.3268789052963257, "regret": 0.4761722683906555, "entropy": 0.6773893237113953, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:42.157062Z", "loop": 951, "env_steps": 584908799, "loss": 0.014210358262062073, "avg_return": 0.320295125246048, "regret": 0.4761722683906555, "entropy": 0.6740739345550537, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:43.315993Z", "loop": 952, "env_steps": 585523199, "loss": 0.014364597387611866, "avg_return": 0.3300485908985138, "regret": 0.4761722683906555, "entropy": 0.6709110140800476, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:44.474284Z", "loop": 953, "env_steps": 586137599, "loss": 0.014227613806724548, "avg_return": 0.32996121048927307, "regret": 0.4761722683906555, "entropy": 0.6724115014076233, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:45.633047Z", "loop": 954, "env_steps": 586751999, "loss": 0.014707515947520733, "avg_return": 0.32998672127723694, "regret": 0.4761722683906555, "entropy": 0.6719834804534912, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:46.838078Z", "loop": 955, "env_steps": 587366399, "loss": 0.01445256918668747, "avg_return": 0.329141229391098, "regret": 0.47417399287223816, "entropy": 0.6701682209968567, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:48.003001Z", "loop": 956, "env_steps": 587980799, "loss": 0.014025035314261913, "avg_return": 0.33080676198005676, "regret": 0.47417399287223816, "entropy": 0.6680786609649658, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:49.164786Z", "loop": 957, "env_steps": 588595199, "loss": 0.01384761929512024, "avg_return": 0.3278019428253174, "regret": 0.47417399287223816, "entropy": 0.6644608974456787, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:50.325206Z", "loop": 958, "env_steps": 589209599, "loss": 0.012606538832187653, "avg_return": 0.333467572927475, "regret": 0.47417399287223816, "entropy": 0.6647287607192993, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:51.485647Z", "loop": 959, "env_steps": 589823999, "loss": 0.01378973014652729, "avg_return": 0.3292404115200043, "regret": 0.47417399287223816, "entropy": 0.6642194390296936, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:52.691362Z", "loop": 960, "env_steps": 590438399, "loss": 0.015007728710770607, "avg_return": 0.33557698130607605, "regret": 0.4720844328403473, "entropy": 0.6627183556556702, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:53.850905Z", "loop": 961, "env_steps": 591052799, "loss": 0.014131958596408367, "avg_return": 0.32542142271995544, "regret": 0.4720844328403473, "entropy": 0.6464650630950928, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:55.010468Z", "loop": 962, "env_steps": 591667199, "loss": 0.013695132918655872, "avg_return": 0.32434529066085815, "regret": 0.4720844328403473, "entropy": 0.6455032825469971, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:56.171870Z", "loop": 963, "env_steps": 592281599, "loss": 0.013551036827266216, "avg_return": 0.3364526033401489, "regret": 0.4720844328403473, "entropy": 0.6539703607559204, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:57.330441Z", "loop": 964, "env_steps": 592895999, "loss": 0.013815443031489849, "avg_return": 0.3334490656852722, "regret": 0.4720844328403473, "entropy": 0.6532806754112244, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:58.534560Z", "loop": 965, "env_steps": 593510399, "loss": 0.01464595552533865, "avg_return": 0.3343122601509094, "regret": 0.4739970564842224, "entropy": 0.6396164298057556, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:44:59.695551Z", "loop": 966, "env_steps": 594124799, "loss": 0.013776910491287708, "avg_return": 0.3346482515335083, "regret": 0.4739970564842224, "entropy": 0.6406345963478088, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:00.856120Z", "loop": 967, "env_steps": 594739199, "loss": 0.01381476130336523, "avg_return": 0.34042349457740784, "regret": 0.4739970564842224, "entropy": 0.6485536098480225, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:02.015537Z", "loop": 968, "env_steps": 595353599, "loss": 0.01212991587817669, "avg_return": 0.3290826976299286, "regret": 0.4739970564842224, "entropy": 0.6437591910362244, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:03.174901Z", "loop": 969, "env_steps": 595967999, "loss": 0.01303594559431076, "avg_return": 0.32632964849472046, "regret": 0.4739970564842224, "entropy": 0.6210271716117859, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:04.376193Z", "loop": 970, "env_steps": 596582399, "loss": 0.013510276563465595, "avg_return": 0.3329637944698334, "regret": 0.47491025924682617, "entropy": 0.6101688742637634, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:05.536190Z", "loop": 971, "env_steps": 597196799, "loss": 0.012562887743115425, "avg_return": 0.33040255308151245, "regret": 0.47491025924682617, "entropy": 0.6359114646911621, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:06.696215Z", "loop": 972, "env_steps": 597811199, "loss": 0.012813225388526917, "avg_return": 0.33930400013923645, "regret": 0.47491025924682617, "entropy": 0.6359438896179199, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:07.857496Z", "loop": 973, "env_steps": 598425599, "loss": 0.0127176558598876, "avg_return": 0.3339657783508301, "regret": 0.47491025924682617, "entropy": 0.6158965229988098, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:09.016614Z", "loop": 974, "env_steps": 599039999, "loss": 0.012275817804038525, "avg_return": 0.3337862193584442, "regret": 0.47491025924682617, "entropy": 0.6115239858627319, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:10.223215Z", "loop": 975, "env_steps": 599654399, "loss": 0.01241527684032917, "avg_return": 0.3408053517341614, "regret": 0.4676229655742645, "entropy": 0.6250988245010376, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:11.382902Z", "loop": 976, "env_steps": 600268799, "loss": 0.011779114603996277, "avg_return": 0.3413131833076477, "regret": 0.4676229655742645, "entropy": 0.6292375922203064, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:12.543968Z", "loop": 977, "env_steps": 600883199, "loss": 0.012576048262417316, "avg_return": 0.33804118633270264, "regret": 0.4676229655742645, "entropy": 0.6067705750465393, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:13.702989Z", "loop": 978, "env_steps": 601497599, "loss": 0.011899953708052635, "avg_return": 0.3247101902961731, "regret": 0.4676229655742645, "entropy": 0.5923361778259277, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:14.862466Z", "loop": 979, "env_steps": 602111999, "loss": 0.013164249248802662, "avg_return": 0.33863013982772827, "regret": 0.4676229655742645, "entropy": 0.5871884822845459, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:16.067275Z", "loop": 980, "env_steps": 602726399, "loss": 0.01167865376919508, "avg_return": 0.3309822082519531, "regret": 0.4659787118434906, "entropy": 0.6033087968826294, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:17.228070Z", "loop": 981, "env_steps": 603340799, "loss": 0.011118079535663128, "avg_return": 0.3425081968307495, "regret": 0.4659787118434906, "entropy": 0.6200905442237854, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:18.387915Z", "loop": 982, "env_steps": 603955199, "loss": 0.011964634992182255, "avg_return": 0.33838990330696106, "regret": 0.4659787118434906, "entropy": 0.6166918873786926, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:19.549286Z", "loop": 983, "env_steps": 604569599, "loss": 0.01131031196564436, "avg_return": 0.3432779908180237, "regret": 0.4659787118434906, "entropy": 0.6108660697937012, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:20.708646Z", "loop": 984, "env_steps": 605183999, "loss": 0.012211970053613186, "avg_return": 0.34630081057548523, "regret": 0.4659787118434906, "entropy": 0.6097956299781799, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:21.914204Z", "loop": 985, "env_steps": 605798399, "loss": 0.011156079359352589, "avg_return": 0.3460851013660431, "regret": 0.4626612961292267, "entropy": 0.6092032194137573, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:23.074947Z", "loop": 986, "env_steps": 606412799, "loss": 0.011336682364344597, "avg_return": 0.3413548469543457, "regret": 0.4626612961292267, "entropy": 0.6088871359825134, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:24.238408Z", "loop": 987, "env_steps": 607027199, "loss": 0.011065863072872162, "avg_return": 0.3418576419353485, "regret": 0.4626612961292267, "entropy": 0.6042870283126831, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:25.399271Z", "loop": 988, "env_steps": 607641599, "loss": 0.010520805604755878, "avg_return": 0.33814433217048645, "regret": 0.4626612961292267, "entropy": 0.5986809134483337, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:26.560731Z", "loop": 989, "env_steps": 608255999, "loss": 0.01099859457463026, "avg_return": 0.34849661588668823, "regret": 0.4626612961292267, "entropy": 0.5977830290794373, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:27.772390Z", "loop": 990, "env_steps": 608870399, "loss": 0.01039999257773161, "avg_return": 0.34240812063217163, "regret": 0.45959967374801636, "entropy": 0.5971423983573914, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:28.932410Z", "loop": 991, "env_steps": 609484799, "loss": 0.010038826614618301, "avg_return": 0.3433588147163391, "regret": 0.45959967374801636, "entropy": 0.5926777124404907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:30.090650Z", "loop": 992, "env_steps": 610099199, "loss": 0.010530724190175533, "avg_return": 0.3426474332809448, "regret": 0.45959967374801636, "entropy": 0.5854353904724121, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:31.250821Z", "loop": 993, "env_steps": 610713599, "loss": 0.011020858772099018, "avg_return": 0.3495858907699585, "regret": 0.45959967374801636, "entropy": 0.5728597044944763, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:32.411168Z", "loop": 994, "env_steps": 611327999, "loss": 0.00963140930980444, "avg_return": 0.33838707208633423, "regret": 0.45959967374801636, "entropy": 0.5666121244430542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:33.616251Z", "loop": 995, "env_steps": 611942399, "loss": 0.010551257990300655, "avg_return": 0.3406601548194885, "regret": 0.45837539434432983, "entropy": 0.5658858418464661, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:34.775386Z", "loop": 996, "env_steps": 612556799, "loss": 0.010163386352360249, "avg_return": 0.3438737690448761, "regret": 0.45837539434432983, "entropy": 0.578001856803894, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:35.935123Z", "loop": 997, "env_steps": 613171199, "loss": 0.009588542394340038, "avg_return": 0.3433476388454437, "regret": 0.45837539434432983, "entropy": 0.5821807980537415, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:37.094835Z", "loop": 998, "env_steps": 613785599, "loss": 0.009443617425858974, "avg_return": 0.34868255257606506, "regret": 0.45837539434432983, "entropy": 0.5770784020423889, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:38.254177Z", "loop": 999, "env_steps": 614399999, "loss": 0.010136309079825878, "avg_return": 0.3515753149986267, "regret": 0.45837539434432983, "entropy": 0.5736778378486633, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:39.460174Z", "loop": 1000, "env_steps": 615014399, "loss": 0.00994367990642786, "avg_return": 0.3514275550842285, "regret": 0.4565415382385254, "entropy": 0.5744423270225525, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:40.621186Z", "loop": 1001, "env_steps": 615628799, "loss": 0.00982324406504631, "avg_return": 0.3466957211494446, "regret": 0.4565415382385254, "entropy": 0.5737901926040649, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:41.780895Z", "loop": 1002, "env_steps": 616243199, "loss": 0.010077315382659435, "avg_return": 0.3463505208492279, "regret": 0.4565415382385254, "entropy": 0.5652356743812561, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:42.941287Z", "loop": 1003, "env_steps": 616857599, "loss": 0.010479094460606575, "avg_return": 0.34821975231170654, "regret": 0.4565415382385254, "entropy": 0.5622555613517761, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:44.101661Z", "loop": 1004, "env_steps": 617471999, "loss": 0.01033193338662386, "avg_return": 0.34898626804351807, "regret": 0.4565415382385254, "entropy": 0.5548098683357239, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:45.308544Z", "loop": 1005, "env_steps": 618086399, "loss": 0.009801222942769527, "avg_return": 0.340434730052948, "regret": 0.45595449209213257, "entropy": 0.5590791702270508, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:46.468156Z", "loop": 1006, "env_steps": 618700799, "loss": 0.009380003437399864, "avg_return": 0.35631439089775085, "regret": 0.45595449209213257, "entropy": 0.5516668558120728, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:47.629061Z", "loop": 1007, "env_steps": 619315199, "loss": 0.009834608994424343, "avg_return": 0.3458101153373718, "regret": 0.45595449209213257, "entropy": 0.5214135646820068, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:48.790104Z", "loop": 1008, "env_steps": 619929599, "loss": 0.009892521426081657, "avg_return": 0.3330552279949188, "regret": 0.45595449209213257, "entropy": 0.47825726866722107, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:49.949526Z", "loop": 1009, "env_steps": 620543999, "loss": 0.011628758162260056, "avg_return": 0.34050074219703674, "regret": 0.45595449209213257, "entropy": 0.45405930280685425, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:51.154864Z", "loop": 1010, "env_steps": 621158399, "loss": 0.010383385233581066, "avg_return": 0.34149032831192017, "regret": 0.45834288001060486, "entropy": 0.48673832416534424, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:52.316960Z", "loop": 1011, "env_steps": 621772799, "loss": 0.009118380956351757, "avg_return": 0.3479655086994171, "regret": 0.45834288001060486, "entropy": 0.5210635662078857, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:53.481388Z", "loop": 1012, "env_steps": 622387199, "loss": 0.00922961626201868, "avg_return": 0.35344788432121277, "regret": 0.45834288001060486, "entropy": 0.544944703578949, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:54.640905Z", "loop": 1013, "env_steps": 623001599, "loss": 0.009660220704972744, "avg_return": 0.34990158677101135, "regret": 0.45834288001060486, "entropy": 0.5370216369628906, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:55.800436Z", "loop": 1014, "env_steps": 623615999, "loss": 0.010016633197665215, "avg_return": 0.34741055965423584, "regret": 0.45834288001060486, "entropy": 0.5233337879180908, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:57.005315Z", "loop": 1015, "env_steps": 624230399, "loss": 0.011189489625394344, "avg_return": 0.3511478900909424, "regret": 0.4593442678451538, "entropy": 0.5129676461219788, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:58.167589Z", "loop": 1016, "env_steps": 624844799, "loss": 0.008773437701165676, "avg_return": 0.3493508994579315, "regret": 0.4593442678451538, "entropy": 0.5282682776451111, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:45:59.326918Z", "loop": 1017, "env_steps": 625459199, "loss": 0.00966730434447527, "avg_return": 0.3540065884590149, "regret": 0.4593442678451538, "entropy": 0.5328881144523621, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:00.487409Z", "loop": 1018, "env_steps": 626073599, "loss": 0.009145278483629227, "avg_return": 0.3557632565498352, "regret": 0.4593442678451538, "entropy": 0.5253486037254333, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:01.646180Z", "loop": 1019, "env_steps": 626687999, "loss": 0.009558039717376232, "avg_return": 0.35698190331459045, "regret": 0.4593442678451538, "entropy": 0.5002470016479492, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:02.853536Z", "loop": 1020, "env_steps": 627302399, "loss": 0.008737431839108467, "avg_return": 0.35559266805648804, "regret": 0.45084819197654724, "entropy": 0.48278388381004333, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:04.014305Z", "loop": 1021, "env_steps": 627916799, "loss": 0.008780024014413357, "avg_return": 0.3519861102104187, "regret": 0.45084819197654724, "entropy": 0.4604624807834625, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:05.173762Z", "loop": 1022, "env_steps": 628531199, "loss": 0.0087840361520648, "avg_return": 0.3665315508842468, "regret": 0.45084819197654724, "entropy": 0.4797784686088562, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:06.332865Z", "loop": 1023, "env_steps": 629145599, "loss": 0.007855617441236973, "avg_return": 0.35236892104148865, "regret": 0.45084819197654724, "entropy": 0.49517080187797546, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:07.492420Z", "loop": 1024, "env_steps": 629759999, "loss": 0.009142863564193249, "avg_return": 0.3624947667121887, "regret": 0.45084819197654724, "entropy": 0.5057551860809326, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:08.702348Z", "loop": 1025, "env_steps": 630374399, "loss": 0.008328437805175781, "avg_return": 0.35232824087142944, "regret": 0.4493587017059326, "entropy": 0.5065920948982239, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:09.863403Z", "loop": 1026, "env_steps": 630988799, "loss": 0.00887046568095684, "avg_return": 0.35156819224357605, "regret": 0.4493587017059326, "entropy": 0.49591052532196045, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:11.029263Z", "loop": 1027, "env_steps": 631603199, "loss": 0.008811245672404766, "avg_return": 0.3467065393924713, "regret": 0.4493587017059326, "entropy": 0.4801830053329468, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:12.188931Z", "loop": 1028, "env_steps": 632217599, "loss": 0.00868214201182127, "avg_return": 0.3592558801174164, "regret": 0.4493587017059326, "entropy": 0.49779200553894043, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:13.353282Z", "loop": 1029, "env_steps": 632831999, "loss": 0.007918932475149632, "avg_return": 0.35482916235923767, "regret": 0.4493587017059326, "entropy": 0.48890578746795654, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:14.560420Z", "loop": 1030, "env_steps": 633446399, "loss": 0.008114912547171116, "avg_return": 0.360545814037323, "regret": 0.4460681676864624, "entropy": 0.46217694878578186, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:15.720201Z", "loop": 1031, "env_steps": 634060799, "loss": 0.0081822220236063, "avg_return": 0.3545166552066803, "regret": 0.4460681676864624, "entropy": 0.4193703532218933, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:16.880270Z", "loop": 1032, "env_steps": 634675199, "loss": 0.008806927129626274, "avg_return": 0.3492240905761719, "regret": 0.4460681676864624, "entropy": 0.3885818123817444, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:18.040842Z", "loop": 1033, "env_steps": 635289599, "loss": 0.00895173754543066, "avg_return": 0.3532736897468567, "regret": 0.4460681676864624, "entropy": 0.3859110176563263, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:19.200476Z", "loop": 1034, "env_steps": 635903999, "loss": 0.008179876953363419, "avg_return": 0.3566008508205414, "regret": 0.4460681676864624, "entropy": 0.41419997811317444, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:20.407550Z", "loop": 1035, "env_steps": 636518399, "loss": 0.008172435685992241, "avg_return": 0.3683232069015503, "regret": 0.4445343315601349, "entropy": 0.44709157943725586, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:21.567649Z", "loop": 1036, "env_steps": 637132799, "loss": 0.007396947126835585, "avg_return": 0.3602030277252197, "regret": 0.4445343315601349, "entropy": 0.4826139211654663, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:22.727097Z", "loop": 1037, "env_steps": 637747199, "loss": 0.007707925979048014, "avg_return": 0.3617055118083954, "regret": 0.4445343315601349, "entropy": 0.48383283615112305, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:23.886877Z", "loop": 1038, "env_steps": 638361599, "loss": 0.008211443200707436, "avg_return": 0.35220733284950256, "regret": 0.4445343315601349, "entropy": 0.4622834324836731, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:25.048022Z", "loop": 1039, "env_steps": 638975999, "loss": 0.009477055631577969, "avg_return": 0.34707143902778625, "regret": 0.4445343315601349, "entropy": 0.4489603340625763, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:26.255266Z", "loop": 1040, "env_steps": 639590399, "loss": 0.00933556817471981, "avg_return": 0.3522898852825165, "regret": 0.4496612548828125, "entropy": 0.4563441276550293, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:27.415999Z", "loop": 1041, "env_steps": 640204799, "loss": 0.00749897351488471, "avg_return": 0.36034372448921204, "regret": 0.4496612548828125, "entropy": 0.4735589027404785, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:28.575167Z", "loop": 1042, "env_steps": 640819199, "loss": 0.007484062109142542, "avg_return": 0.35754597187042236, "regret": 0.4496612548828125, "entropy": 0.47331780195236206, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:29.737150Z", "loop": 1043, "env_steps": 641433599, "loss": 0.007875650189816952, "avg_return": 0.3662119507789612, "regret": 0.4496612548828125, "entropy": 0.45999857783317566, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:30.897486Z", "loop": 1044, "env_steps": 642047999, "loss": 0.007780056446790695, "avg_return": 0.3669314980506897, "regret": 0.4496612548828125, "entropy": 0.398486465215683, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:32.102294Z", "loop": 1045, "env_steps": 642662399, "loss": 0.008286981843411922, "avg_return": 0.35218462347984314, "regret": 0.4504495859146118, "entropy": 0.34603604674339294, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:33.262090Z", "loop": 1046, "env_steps": 643276799, "loss": 0.008599168621003628, "avg_return": 0.34443971514701843, "regret": 0.4504495859146118, "entropy": 0.3235517740249634, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:34.423112Z", "loop": 1047, "env_steps": 643891199, "loss": 0.008857703767716885, "avg_return": 0.3541093170642853, "regret": 0.4504495859146118, "entropy": 0.34045132994651794, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:35.585567Z", "loop": 1048, "env_steps": 644505599, "loss": 0.007128923665732145, "avg_return": 0.3587636947631836, "regret": 0.4504495859146118, "entropy": 0.3798682689666748, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:36.751189Z", "loop": 1049, "env_steps": 645119999, "loss": 0.007109025027602911, "avg_return": 0.36701905727386475, "regret": 0.4504495859146118, "entropy": 0.4312933683395386, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:37.960502Z", "loop": 1050, "env_steps": 645734399, "loss": 0.007042670156806707, "avg_return": 0.3626919686794281, "regret": 0.4399970471858978, "entropy": 0.4565249979496002, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:39.121072Z", "loop": 1051, "env_steps": 646348799, "loss": 0.007106255739927292, "avg_return": 0.36419469118118286, "regret": 0.4399970471858978, "entropy": 0.445896178483963, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:40.280564Z", "loop": 1052, "env_steps": 646963199, "loss": 0.0075636799447238445, "avg_return": 0.3556848168373108, "regret": 0.4399970471858978, "entropy": 0.4213128089904785, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:41.440846Z", "loop": 1053, "env_steps": 647577599, "loss": 0.007564648520201445, "avg_return": 0.35708749294281006, "regret": 0.4399970471858978, "entropy": 0.42673933506011963, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:42.602339Z", "loop": 1054, "env_steps": 648191999, "loss": 0.007112462073564529, "avg_return": 0.3600063621997833, "regret": 0.4399970471858978, "entropy": 0.4314771592617035, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:43.818117Z", "loop": 1055, "env_steps": 648806399, "loss": 0.006721802055835724, "avg_return": 0.3681522011756897, "regret": 0.43997108936309814, "entropy": 0.4479314386844635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:44.980253Z", "loop": 1056, "env_steps": 649420799, "loss": 0.0065690502524375916, "avg_return": 0.36656561493873596, "regret": 0.43997108936309814, "entropy": 0.4423210322856903, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:46.142828Z", "loop": 1057, "env_steps": 650035199, "loss": 0.0064913551323115826, "avg_return": 0.367731511592865, "regret": 0.43997108936309814, "entropy": 0.40742042660713196, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:47.304228Z", "loop": 1058, "env_steps": 650649599, "loss": 0.006624785717576742, "avg_return": 0.36240142583847046, "regret": 0.43997108936309814, "entropy": 0.3673771321773529, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:48.463519Z", "loop": 1059, "env_steps": 651263999, "loss": 0.006637238897383213, "avg_return": 0.36210593581199646, "regret": 0.43997108936309814, "entropy": 0.33340367674827576, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:49.668701Z", "loop": 1060, "env_steps": 651878399, "loss": 0.007820279337465763, "avg_return": 0.3554861545562744, "regret": 0.4466913640499115, "entropy": 0.31081900000572205, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:50.828310Z", "loop": 1061, "env_steps": 652492799, "loss": 0.007215541787445545, "avg_return": 0.35622546076774597, "regret": 0.4466913640499115, "entropy": 0.2991940975189209, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:51.989655Z", "loop": 1062, "env_steps": 653107199, "loss": 0.007345158141106367, "avg_return": 0.36306682229042053, "regret": 0.4466913640499115, "entropy": 0.3087714910507202, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:53.149392Z", "loop": 1063, "env_steps": 653721599, "loss": 0.006770735140889883, "avg_return": 0.3604572117328644, "regret": 0.4466913640499115, "entropy": 0.32510966062545776, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:54.309345Z", "loop": 1064, "env_steps": 654335999, "loss": 0.006413609720766544, "avg_return": 0.3577413260936737, "regret": 0.4466913640499115, "entropy": 0.3418956398963928, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:55.514708Z", "loop": 1065, "env_steps": 654950399, "loss": 0.005957215558737516, "avg_return": 0.3701898753643036, "regret": 0.4359471797943115, "entropy": 0.3750959634780884, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:56.676300Z", "loop": 1066, "env_steps": 655564799, "loss": 0.006033628713339567, "avg_return": 0.364641010761261, "regret": 0.4359471797943115, "entropy": 0.3995233178138733, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:57.840593Z", "loop": 1067, "env_steps": 656179199, "loss": 0.006682502571493387, "avg_return": 0.371188759803772, "regret": 0.4359471797943115, "entropy": 0.40541085600852966, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:46:59.002899Z", "loop": 1068, "env_steps": 656793599, "loss": 0.00574519345536828, "avg_return": 0.3737134635448456, "regret": 0.4359471797943115, "entropy": 0.42794764041900635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:00.163419Z", "loop": 1069, "env_steps": 657407999, "loss": 0.0068022566847503185, "avg_return": 0.3724905550479889, "regret": 0.4359471797943115, "entropy": 0.40385425090789795, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:01.379829Z", "loop": 1070, "env_steps": 658022399, "loss": 0.006202287971973419, "avg_return": 0.36306342482566833, "regret": 0.4361094832420349, "entropy": 0.4023350477218628, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:02.542847Z", "loop": 1071, "env_steps": 658636799, "loss": 0.005733546335250139, "avg_return": 0.36743277311325073, "regret": 0.4361094832420349, "entropy": 0.39872169494628906, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:03.702161Z", "loop": 1072, "env_steps": 659251199, "loss": 0.0068871318362653255, "avg_return": 0.36952006816864014, "regret": 0.4361094832420349, "entropy": 0.37026289105415344, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:04.863146Z", "loop": 1073, "env_steps": 659865599, "loss": 0.005889759864658117, "avg_return": 0.36525219678878784, "regret": 0.4361094832420349, "entropy": 0.36833012104034424, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:06.022873Z", "loop": 1074, "env_steps": 660479999, "loss": 0.0064246985130012035, "avg_return": 0.36744239926338196, "regret": 0.4361094832420349, "entropy": 0.3750866651535034, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:07.230097Z", "loop": 1075, "env_steps": 661094399, "loss": 0.006188852246850729, "avg_return": 0.368346244096756, "regret": 0.4344603717327118, "entropy": 0.39101094007492065, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:08.390708Z", "loop": 1076, "env_steps": 661708799, "loss": 0.006042318884283304, "avg_return": 0.36966121196746826, "regret": 0.4344603717327118, "entropy": 0.4164748787879944, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:09.552191Z", "loop": 1077, "env_steps": 662323199, "loss": 0.006044969893991947, "avg_return": 0.36591652035713196, "regret": 0.4344603717327118, "entropy": 0.4090096950531006, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:10.712160Z", "loop": 1078, "env_steps": 662937599, "loss": 0.0058737704530358315, "avg_return": 0.3707941770553589, "regret": 0.4344603717327118, "entropy": 0.4002363681793213, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:11.873242Z", "loop": 1079, "env_steps": 663551999, "loss": 0.0052641634829342365, "avg_return": 0.3741694688796997, "regret": 0.4344603717327118, "entropy": 0.38357630372047424, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:13.082176Z", "loop": 1080, "env_steps": 664166399, "loss": 0.005323446821421385, "avg_return": 0.36936455965042114, "regret": 0.43150052428245544, "entropy": 0.3520033061504364, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:14.245351Z", "loop": 1081, "env_steps": 664780799, "loss": 0.005773819983005524, "avg_return": 0.36873918771743774, "regret": 0.43150052428245544, "entropy": 0.3150600492954254, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:15.407233Z", "loop": 1082, "env_steps": 665395199, "loss": 0.005746245384216309, "avg_return": 0.37395167350769043, "regret": 0.43150052428245544, "entropy": 0.2869604825973511, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:16.568715Z", "loop": 1083, "env_steps": 666009599, "loss": 0.005489734001457691, "avg_return": 0.3644082844257355, "regret": 0.43150052428245544, "entropy": 0.27517393231391907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:17.729242Z", "loop": 1084, "env_steps": 666623999, "loss": 0.0052278777584433556, "avg_return": 0.3686826229095459, "regret": 0.43150052428245544, "entropy": 0.24765676259994507, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:18.940907Z", "loop": 1085, "env_steps": 667238399, "loss": 0.0057278964668512344, "avg_return": 0.36631858348846436, "regret": 0.4371615946292877, "entropy": 0.24112433195114136, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:20.101391Z", "loop": 1086, "env_steps": 667852799, "loss": 0.005403926130384207, "avg_return": 0.36584439873695374, "regret": 0.4371615946292877, "entropy": 0.270961195230484, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:21.261247Z", "loop": 1087, "env_steps": 668467199, "loss": 0.005360197275876999, "avg_return": 0.37944495677948, "regret": 0.4371615946292877, "entropy": 0.3046223521232605, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:22.424038Z", "loop": 1088, "env_steps": 669081599, "loss": 0.005591321270912886, "avg_return": 0.3739471137523651, "regret": 0.4371615946292877, "entropy": 0.30262020230293274, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:23.583522Z", "loop": 1089, "env_steps": 669695999, "loss": 0.005176772829145193, "avg_return": 0.3736743628978729, "regret": 0.4371615946292877, "entropy": 0.2968839704990387, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:24.788490Z", "loop": 1090, "env_steps": 670310399, "loss": 0.005148975178599358, "avg_return": 0.368879109621048, "regret": 0.4297216832637787, "entropy": 0.31114065647125244, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:25.949674Z", "loop": 1091, "env_steps": 670924799, "loss": 0.005230157636106014, "avg_return": 0.37980443239212036, "regret": 0.4297216832637787, "entropy": 0.32903018593788147, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:27.113457Z", "loop": 1092, "env_steps": 671539199, "loss": 0.005361686926335096, "avg_return": 0.3803211450576782, "regret": 0.4297216832637787, "entropy": 0.35833683609962463, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:28.272461Z", "loop": 1093, "env_steps": 672153599, "loss": 0.005450563505291939, "avg_return": 0.3826664388179779, "regret": 0.4297216832637787, "entropy": 0.36933308839797974, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:29.434403Z", "loop": 1094, "env_steps": 672767999, "loss": 0.005173963960260153, "avg_return": 0.37183845043182373, "regret": 0.4297216832637787, "entropy": 0.38129353523254395, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:30.643822Z", "loop": 1095, "env_steps": 673382399, "loss": 0.005976835265755653, "avg_return": 0.3854580819606781, "regret": 0.427376925945282, "entropy": 0.38170963525772095, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:31.804483Z", "loop": 1096, "env_steps": 673996799, "loss": 0.00518380431458354, "avg_return": 0.37718796730041504, "regret": 0.427376925945282, "entropy": 0.3713546395301819, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:32.964878Z", "loop": 1097, "env_steps": 674611199, "loss": 0.005108647048473358, "avg_return": 0.37485137581825256, "regret": 0.427376925945282, "entropy": 0.3661998212337494, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:34.127533Z", "loop": 1098, "env_steps": 675225599, "loss": 0.00506462249904871, "avg_return": 0.3809203803539276, "regret": 0.427376925945282, "entropy": 0.37082603573799133, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:35.290883Z", "loop": 1099, "env_steps": 675839999, "loss": 0.005219423212110996, "avg_return": 0.3759904205799103, "regret": 0.427376925945282, "entropy": 0.3810313642024994, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:36.494490Z", "loop": 1100, "env_steps": 676454399, "loss": 0.005863155238330364, "avg_return": 0.3781220316886902, "regret": 0.4257567822933197, "entropy": 0.3805864453315735, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:37.652958Z", "loop": 1101, "env_steps": 677068799, "loss": 0.0049215080216526985, "avg_return": 0.3691541850566864, "regret": 0.4257567822933197, "entropy": 0.37703102827072144, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:38.812866Z", "loop": 1102, "env_steps": 677683199, "loss": 0.00537918834015727, "avg_return": 0.3743484914302826, "regret": 0.4257567822933197, "entropy": 0.3239935338497162, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:39.971848Z", "loop": 1103, "env_steps": 678297599, "loss": 0.004753501620143652, "avg_return": 0.3750854730606079, "regret": 0.4257567822933197, "entropy": 0.28091368079185486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:41.131644Z", "loop": 1104, "env_steps": 678911999, "loss": 0.00472751772031188, "avg_return": 0.37543433904647827, "regret": 0.4257567822933197, "entropy": 0.2521710991859436, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:42.334441Z", "loop": 1105, "env_steps": 679526399, "loss": 0.004833012819290161, "avg_return": 0.3772571384906769, "regret": 0.428648978471756, "entropy": 0.24756211042404175, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:43.493692Z", "loop": 1106, "env_steps": 680140799, "loss": 0.004857861902564764, "avg_return": 0.3776891529560089, "regret": 0.428648978471756, "entropy": 0.2644558250904083, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:44.653161Z", "loop": 1107, "env_steps": 680755199, "loss": 0.004583705682307482, "avg_return": 0.3770091235637665, "regret": 0.428648978471756, "entropy": 0.3243604004383087, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:45.813002Z", "loop": 1108, "env_steps": 681369599, "loss": 0.005235899239778519, "avg_return": 0.37391141057014465, "regret": 0.428648978471756, "entropy": 0.3632737100124359, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:46.971608Z", "loop": 1109, "env_steps": 681983999, "loss": 0.005245577078312635, "avg_return": 0.38171476125717163, "regret": 0.428648978471756, "entropy": 0.33568957448005676, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:48.174976Z", "loop": 1110, "env_steps": 682598399, "loss": 0.005032690707594156, "avg_return": 0.37946781516075134, "regret": 0.4259500503540039, "entropy": 0.2861437499523163, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:49.336076Z", "loop": 1111, "env_steps": 683212799, "loss": 0.004568751901388168, "avg_return": 0.3764600455760956, "regret": 0.4259500503540039, "entropy": 0.3016100823879242, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:50.496696Z", "loop": 1112, "env_steps": 683827199, "loss": 0.005042755976319313, "avg_return": 0.37752947211265564, "regret": 0.4259500503540039, "entropy": 0.32632219791412354, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:51.655739Z", "loop": 1113, "env_steps": 684441599, "loss": 0.0051360600627958775, "avg_return": 0.38082432746887207, "regret": 0.4259500503540039, "entropy": 0.34937065839767456, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:52.815836Z", "loop": 1114, "env_steps": 685055999, "loss": 0.005588369444012642, "avg_return": 0.38258159160614014, "regret": 0.4259500503540039, "entropy": 0.35408133268356323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:54.022641Z", "loop": 1115, "env_steps": 685670399, "loss": 0.0055129691027104855, "avg_return": 0.3849497437477112, "regret": 0.42195403575897217, "entropy": 0.3464224636554718, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:55.187996Z", "loop": 1116, "env_steps": 686284799, "loss": 0.005184364039450884, "avg_return": 0.37925034761428833, "regret": 0.42195403575897217, "entropy": 0.32307156920433044, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:56.348367Z", "loop": 1117, "env_steps": 686899199, "loss": 0.004628888331353664, "avg_return": 0.3793416917324066, "regret": 0.42195403575897217, "entropy": 0.30851393938064575, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:57.513022Z", "loop": 1118, "env_steps": 687513599, "loss": 0.004925094544887543, "avg_return": 0.39006882905960083, "regret": 0.42195403575897217, "entropy": 0.29460760951042175, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:58.673888Z", "loop": 1119, "env_steps": 688127999, "loss": 0.00468275835737586, "avg_return": 0.3860701620578766, "regret": 0.42195403575897217, "entropy": 0.27891039848327637, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:47:59.876797Z", "loop": 1120, "env_steps": 688742399, "loss": 0.004326266702264547, "avg_return": 0.37923482060432434, "regret": 0.4232648015022278, "entropy": 0.25756558775901794, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:01.038596Z", "loop": 1121, "env_steps": 689356799, "loss": 0.004443916026502848, "avg_return": 0.374169260263443, "regret": 0.4232648015022278, "entropy": 0.24934843182563782, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:02.198387Z", "loop": 1122, "env_steps": 689971199, "loss": 0.004482851829379797, "avg_return": 0.38058915734291077, "regret": 0.4232648015022278, "entropy": 0.25437793135643005, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:03.358717Z", "loop": 1123, "env_steps": 690585599, "loss": 0.004377198405563831, "avg_return": 0.37498506903648376, "regret": 0.4232648015022278, "entropy": 0.25808805227279663, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:04.518404Z", "loop": 1124, "env_steps": 691199999, "loss": 0.0045150090008974075, "avg_return": 0.37778085470199585, "regret": 0.4232648015022278, "entropy": 0.25976744294166565, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:05.726261Z", "loop": 1125, "env_steps": 691814399, "loss": 0.0043226624839007854, "avg_return": 0.37775707244873047, "regret": 0.4219494163990021, "entropy": 0.25794610381126404, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:06.885902Z", "loop": 1126, "env_steps": 692428799, "loss": 0.004517667926847935, "avg_return": 0.378172367811203, "regret": 0.4219494163990021, "entropy": 0.27200847864151, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:08.050960Z", "loop": 1127, "env_steps": 693043199, "loss": 0.004644216038286686, "avg_return": 0.37982696294784546, "regret": 0.4219494163990021, "entropy": 0.30169233679771423, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:09.211430Z", "loop": 1128, "env_steps": 693657599, "loss": 0.004236920736730099, "avg_return": 0.39367184042930603, "regret": 0.4219494163990021, "entropy": 0.32479429244995117, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:10.374178Z", "loop": 1129, "env_steps": 694271999, "loss": 0.005602313205599785, "avg_return": 0.38945186138153076, "regret": 0.4219494163990021, "entropy": 0.3345281779766083, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:11.584779Z", "loop": 1130, "env_steps": 694886399, "loss": 0.004899319261312485, "avg_return": 0.3900817334651947, "regret": 0.41700032353401184, "entropy": 0.3509906828403473, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:12.744154Z", "loop": 1131, "env_steps": 695500799, "loss": 0.004904671106487513, "avg_return": 0.3783439099788666, "regret": 0.41700032353401184, "entropy": 0.3496922254562378, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:13.902719Z", "loop": 1132, "env_steps": 696115199, "loss": 0.004644733387976885, "avg_return": 0.38320431113243103, "regret": 0.41700032353401184, "entropy": 0.3567693531513214, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:15.062031Z", "loop": 1133, "env_steps": 696729599, "loss": 0.005268215201795101, "avg_return": 0.39012736082077026, "regret": 0.41700032353401184, "entropy": 0.3312276601791382, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:16.221461Z", "loop": 1134, "env_steps": 697343999, "loss": 0.004884250927716494, "avg_return": 0.38971278071403503, "regret": 0.41700032353401184, "entropy": 0.31106364727020264, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:17.426497Z", "loop": 1135, "env_steps": 697958399, "loss": 0.004800119437277317, "avg_return": 0.3910142779350281, "regret": 0.4156268239021301, "entropy": 0.3245948255062103, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:18.585553Z", "loop": 1136, "env_steps": 698572799, "loss": 0.0049977838061749935, "avg_return": 0.3855820894241333, "regret": 0.4156268239021301, "entropy": 0.3225153088569641, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:19.744464Z", "loop": 1137, "env_steps": 699187199, "loss": 0.005442620255053043, "avg_return": 0.3952076733112335, "regret": 0.4156268239021301, "entropy": 0.3363306224346161, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:20.903395Z", "loop": 1138, "env_steps": 699801599, "loss": 0.005227876361459494, "avg_return": 0.3882945775985718, "regret": 0.4156268239021301, "entropy": 0.3482213616371155, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:22.062934Z", "loop": 1139, "env_steps": 700415999, "loss": 0.00519671430811286, "avg_return": 0.3786720037460327, "regret": 0.4156268239021301, "entropy": 0.3514036238193512, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:23.267141Z", "loop": 1140, "env_steps": 701030399, "loss": 0.005584725644439459, "avg_return": 0.39245110750198364, "regret": 0.4132234454154968, "entropy": 0.34143951535224915, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:24.427180Z", "loop": 1141, "env_steps": 701644799, "loss": 0.005205524154007435, "avg_return": 0.3915589153766632, "regret": 0.4132234454154968, "entropy": 0.32919013500213623, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:25.586383Z", "loop": 1142, "env_steps": 702259199, "loss": 0.005793902091681957, "avg_return": 0.38826292753219604, "regret": 0.4132234454154968, "entropy": 0.3024500608444214, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:26.747125Z", "loop": 1143, "env_steps": 702873599, "loss": 0.005895904265344143, "avg_return": 0.3963702917098999, "regret": 0.4132234454154968, "entropy": 0.30054715275764465, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:27.907913Z", "loop": 1144, "env_steps": 703487999, "loss": 0.005725042428821325, "avg_return": 0.3979039490222931, "regret": 0.4132234454154968, "entropy": 0.3190811276435852, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:29.113568Z", "loop": 1145, "env_steps": 704102399, "loss": 0.005560498684644699, "avg_return": 0.39184895157814026, "regret": 0.4117521643638611, "entropy": 0.33607327938079834, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:30.272959Z", "loop": 1146, "env_steps": 704716799, "loss": 0.00544801726937294, "avg_return": 0.3911237120628357, "regret": 0.4117521643638611, "entropy": 0.3543006479740143, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:31.432992Z", "loop": 1147, "env_steps": 705331199, "loss": 0.005212034564465284, "avg_return": 0.389554888010025, "regret": 0.4117521643638611, "entropy": 0.3435322344303131, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:32.592750Z", "loop": 1148, "env_steps": 705945599, "loss": 0.005924067925661802, "avg_return": 0.39098191261291504, "regret": 0.4117521643638611, "entropy": 0.3306043744087219, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:33.753259Z", "loop": 1149, "env_steps": 706559999, "loss": 0.0056372759863734245, "avg_return": 0.3932262659072876, "regret": 0.4117521643638611, "entropy": 0.325483500957489, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:34.959049Z", "loop": 1150, "env_steps": 707174399, "loss": 0.005632398650050163, "avg_return": 0.3960387408733368, "regret": 0.40831440687179565, "entropy": 0.32536301016807556, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:36.121277Z", "loop": 1151, "env_steps": 707788799, "loss": 0.005276919808238745, "avg_return": 0.39450353384017944, "regret": 0.40831440687179565, "entropy": 0.3164082467556, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:37.281520Z", "loop": 1152, "env_steps": 708403199, "loss": 0.004991353023797274, "avg_return": 0.38871684670448303, "regret": 0.40831440687179565, "entropy": 0.30972015857696533, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:38.444633Z", "loop": 1153, "env_steps": 709017599, "loss": 0.005389607977122068, "avg_return": 0.4014485776424408, "regret": 0.40831440687179565, "entropy": 0.309062123298645, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:39.604852Z", "loop": 1154, "env_steps": 709631999, "loss": 0.005131612531840801, "avg_return": 0.3945372998714447, "regret": 0.40831440687179565, "entropy": 0.3010229468345642, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:40.809816Z", "loop": 1155, "env_steps": 710246399, "loss": 0.005539063364267349, "avg_return": 0.3959711194038391, "regret": 0.406154066324234, "entropy": 0.31892696022987366, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:41.971284Z", "loop": 1156, "env_steps": 710860799, "loss": 0.005496952682733536, "avg_return": 0.39885255694389343, "regret": 0.406154066324234, "entropy": 0.33321237564086914, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:43.133685Z", "loop": 1157, "env_steps": 711475199, "loss": 0.005845433101058006, "avg_return": 0.40652456879615784, "regret": 0.406154066324234, "entropy": 0.3377998173236847, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:44.295262Z", "loop": 1158, "env_steps": 712089599, "loss": 0.005249197129160166, "avg_return": 0.3957381844520569, "regret": 0.406154066324234, "entropy": 0.3349502682685852, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:45.454981Z", "loop": 1159, "env_steps": 712703999, "loss": 0.005834366660565138, "avg_return": 0.39841336011886597, "regret": 0.406154066324234, "entropy": 0.326741099357605, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:46.662967Z", "loop": 1160, "env_steps": 713318399, "loss": 0.00532665615901351, "avg_return": 0.3959232568740845, "regret": 0.40365922451019287, "entropy": 0.32440924644470215, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:47.823167Z", "loop": 1161, "env_steps": 713932799, "loss": 0.00538346404209733, "avg_return": 0.40169602632522583, "regret": 0.40365922451019287, "entropy": 0.32999956607818604, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:48.983212Z", "loop": 1162, "env_steps": 714547199, "loss": 0.0056073288433253765, "avg_return": 0.40595293045043945, "regret": 0.40365922451019287, "entropy": 0.32229599356651306, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:50.143239Z", "loop": 1163, "env_steps": 715161599, "loss": 0.005495772231370211, "avg_return": 0.4040192663669586, "regret": 0.40365922451019287, "entropy": 0.3235337734222412, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:51.303549Z", "loop": 1164, "env_steps": 715775999, "loss": 0.005428930278867483, "avg_return": 0.392927885055542, "regret": 0.40365922451019287, "entropy": 0.3169824779033661, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:52.508000Z", "loop": 1165, "env_steps": 716390399, "loss": 0.00581989623606205, "avg_return": 0.40281692147254944, "regret": 0.4009423851966858, "entropy": 0.3247237205505371, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:53.669289Z", "loop": 1166, "env_steps": 717004799, "loss": 0.005337127484381199, "avg_return": 0.4082498252391815, "regret": 0.4009423851966858, "entropy": 0.3235510289669037, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:54.828698Z", "loop": 1167, "env_steps": 717619199, "loss": 0.004967156797647476, "avg_return": 0.39914730191230774, "regret": 0.4009423851966858, "entropy": 0.32874494791030884, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:55.989813Z", "loop": 1168, "env_steps": 718233599, "loss": 0.005860679782927036, "avg_return": 0.40309175848960876, "regret": 0.4009423851966858, "entropy": 0.3003309369087219, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:57.148375Z", "loop": 1169, "env_steps": 718847999, "loss": 0.0053578950464725494, "avg_return": 0.4090949594974518, "regret": 0.4009423851966858, "entropy": 0.2964317500591278, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:58.350121Z", "loop": 1170, "env_steps": 719462399, "loss": 0.005181174259632826, "avg_return": 0.3959725499153137, "regret": 0.40254443883895874, "entropy": 0.2931598722934723, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:48:59.508400Z", "loop": 1171, "env_steps": 720076799, "loss": 0.0053506395779550076, "avg_return": 0.400204062461853, "regret": 0.40254443883895874, "entropy": 0.30239591002464294, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:00.667066Z", "loop": 1172, "env_steps": 720691199, "loss": 0.005470918025821447, "avg_return": 0.4013791084289551, "regret": 0.40254443883895874, "entropy": 0.322411447763443, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:01.826559Z", "loop": 1173, "env_steps": 721305599, "loss": 0.0054311929270625114, "avg_return": 0.4146674573421478, "regret": 0.40254443883895874, "entropy": 0.3111269772052765, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:02.986747Z", "loop": 1174, "env_steps": 721919999, "loss": 0.005778188351541758, "avg_return": 0.4029509127140045, "regret": 0.40254443883895874, "entropy": 0.3015859127044678, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:04.190823Z", "loop": 1175, "env_steps": 722534399, "loss": 0.005787535570561886, "avg_return": 0.4060077369213104, "regret": 0.39810240268707275, "entropy": 0.28900980949401855, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:05.350786Z", "loop": 1176, "env_steps": 723148799, "loss": 0.005881264340132475, "avg_return": 0.40834078192710876, "regret": 0.39810240268707275, "entropy": 0.29508307576179504, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:06.509271Z", "loop": 1177, "env_steps": 723763199, "loss": 0.005347067955881357, "avg_return": 0.41260474920272827, "regret": 0.39810240268707275, "entropy": 0.3025064766407013, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:07.667208Z", "loop": 1178, "env_steps": 724377599, "loss": 0.005867672618478537, "avg_return": 0.4128172993659973, "regret": 0.39810240268707275, "entropy": 0.3153936564922333, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:08.826560Z", "loop": 1179, "env_steps": 724991999, "loss": 0.0056548635475337505, "avg_return": 0.41469520330429077, "regret": 0.39810240268707275, "entropy": 0.3057619333267212, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:10.029891Z", "loop": 1180, "env_steps": 725606399, "loss": 0.005453317426145077, "avg_return": 0.40299952030181885, "regret": 0.3968082070350647, "entropy": 0.29205748438835144, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:11.189448Z", "loop": 1181, "env_steps": 726220799, "loss": 0.005120542831718922, "avg_return": 0.39392608404159546, "regret": 0.3968082070350647, "entropy": 0.2822873294353485, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:12.348396Z", "loop": 1182, "env_steps": 726835199, "loss": 0.0051832436583936214, "avg_return": 0.40430518984794617, "regret": 0.3968082070350647, "entropy": 0.2775730788707733, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:13.507445Z", "loop": 1183, "env_steps": 727449599, "loss": 0.005295757204294205, "avg_return": 0.4086991846561432, "regret": 0.3968082070350647, "entropy": 0.29371556639671326, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:14.668182Z", "loop": 1184, "env_steps": 728063999, "loss": 0.004967827349901199, "avg_return": 0.4063771665096283, "regret": 0.3968082070350647, "entropy": 0.3183876574039459, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:15.873277Z", "loop": 1185, "env_steps": 728678399, "loss": 0.005843957886099815, "avg_return": 0.41778111457824707, "regret": 0.3897469639778137, "entropy": 0.32310181856155396, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:17.031900Z", "loop": 1186, "env_steps": 729292799, "loss": 0.0066452003084123135, "avg_return": 0.4096338152885437, "regret": 0.3897469639778137, "entropy": 0.2895044684410095, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:18.191330Z", "loop": 1187, "env_steps": 729907199, "loss": 0.0063194818794727325, "avg_return": 0.4058469235897064, "regret": 0.3897469639778137, "entropy": 0.2821902930736542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:19.350396Z", "loop": 1188, "env_steps": 730521599, "loss": 0.006266253534704447, "avg_return": 0.39205190539360046, "regret": 0.3897469639778137, "entropy": 0.2478950023651123, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:20.509341Z", "loop": 1189, "env_steps": 731135999, "loss": 0.0066716051660478115, "avg_return": 0.40178173780441284, "regret": 0.3897469639778137, "entropy": 0.23922330141067505, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:21.715723Z", "loop": 1190, "env_steps": 731750399, "loss": 0.006154713686555624, "avg_return": 0.390186607837677, "regret": 0.4087224304676056, "entropy": 0.23617446422576904, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:22.875929Z", "loop": 1191, "env_steps": 732364799, "loss": 0.006667390000075102, "avg_return": 0.4020208418369293, "regret": 0.4087224304676056, "entropy": 0.2472001612186432, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:24.034726Z", "loop": 1192, "env_steps": 732979199, "loss": 0.006223027128726244, "avg_return": 0.40871772170066833, "regret": 0.4087224304676056, "entropy": 0.26972538232803345, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:25.194648Z", "loop": 1193, "env_steps": 733593599, "loss": 0.006832115352153778, "avg_return": 0.42097795009613037, "regret": 0.4087224304676056, "entropy": 0.30776381492614746, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:26.355764Z", "loop": 1194, "env_steps": 734207999, "loss": 0.005898402072489262, "avg_return": 0.41472744941711426, "regret": 0.4087224304676056, "entropy": 0.31714242696762085, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:27.561357Z", "loop": 1195, "env_steps": 734822399, "loss": 0.005201428197324276, "avg_return": 0.41335856914520264, "regret": 0.3915892243385315, "entropy": 0.3009105324745178, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:28.721418Z", "loop": 1196, "env_steps": 735436799, "loss": 0.00503917969763279, "avg_return": 0.4096018671989441, "regret": 0.3915892243385315, "entropy": 0.27901384234428406, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:29.881890Z", "loop": 1197, "env_steps": 736051199, "loss": 0.005109942983835936, "avg_return": 0.4104563891887665, "regret": 0.3915892243385315, "entropy": 0.2888557016849518, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:31.044060Z", "loop": 1198, "env_steps": 736665599, "loss": 0.005118819884955883, "avg_return": 0.4157463312149048, "regret": 0.3915892243385315, "entropy": 0.2933588922023773, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:32.203025Z", "loop": 1199, "env_steps": 737279999, "loss": 0.00581418676301837, "avg_return": 0.42401641607284546, "regret": 0.3915892243385315, "entropy": 0.2997678518295288, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:33.404841Z", "loop": 1200, "env_steps": 737894399, "loss": 0.006200476083904505, "avg_return": 0.41787734627723694, "regret": 0.38520967960357666, "entropy": 0.3105887770652771, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:34.564713Z", "loop": 1201, "env_steps": 738508799, "loss": 0.005897780880331993, "avg_return": 0.4163846969604492, "regret": 0.38520967960357666, "entropy": 0.3071868419647217, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:35.723984Z", "loop": 1202, "env_steps": 739123199, "loss": 0.005852694623172283, "avg_return": 0.42362043261528015, "regret": 0.38520967960357666, "entropy": 0.3005210757255554, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:36.883250Z", "loop": 1203, "env_steps": 739737599, "loss": 0.005906525533646345, "avg_return": 0.41602981090545654, "regret": 0.38520967960357666, "entropy": 0.3070717751979828, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:38.044006Z", "loop": 1204, "env_steps": 740351999, "loss": 0.0067498036660254, "avg_return": 0.4283079206943512, "regret": 0.38520967960357666, "entropy": 0.30325785279273987, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:39.248270Z", "loop": 1205, "env_steps": 740966399, "loss": 0.006432628724724054, "avg_return": 0.42300158739089966, "regret": 0.38163667917251587, "entropy": 0.28960269689559937, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:40.410208Z", "loop": 1206, "env_steps": 741580799, "loss": 0.006483281496912241, "avg_return": 0.4182060956954956, "regret": 0.38163667917251587, "entropy": 0.2665226459503174, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:41.572749Z", "loop": 1207, "env_steps": 742195199, "loss": 0.006141259800642729, "avg_return": 0.41119736433029175, "regret": 0.38163667917251587, "entropy": 0.2599294185638428, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:42.733384Z", "loop": 1208, "env_steps": 742809599, "loss": 0.007122964598238468, "avg_return": 0.4253809154033661, "regret": 0.38163667917251587, "entropy": 0.2645815312862396, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:43.892828Z", "loop": 1209, "env_steps": 743423999, "loss": 0.006920190062373877, "avg_return": 0.41266924142837524, "regret": 0.38163667917251587, "entropy": 0.2622324228286743, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:45.104426Z", "loop": 1210, "env_steps": 744038399, "loss": 0.006000087596476078, "avg_return": 0.4202597141265869, "regret": 0.3829987049102783, "entropy": 0.2692013382911682, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:46.266799Z", "loop": 1211, "env_steps": 744652799, "loss": 0.006646774243563414, "avg_return": 0.42547526955604553, "regret": 0.3829987049102783, "entropy": 0.2762686610221863, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:47.426809Z", "loop": 1212, "env_steps": 745267199, "loss": 0.00731157511472702, "avg_return": 0.4278911352157593, "regret": 0.3829987049102783, "entropy": 0.28512313961982727, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:48.586054Z", "loop": 1213, "env_steps": 745881599, "loss": 0.006863036658614874, "avg_return": 0.424303263425827, "regret": 0.3829987049102783, "entropy": 0.2832469642162323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:49.746205Z", "loop": 1214, "env_steps": 746495999, "loss": 0.006350745912641287, "avg_return": 0.43294861912727356, "regret": 0.3829987049102783, "entropy": 0.2794208526611328, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:50.952592Z", "loop": 1215, "env_steps": 747110399, "loss": 0.006646054331213236, "avg_return": 0.4284401535987854, "regret": 0.3772609531879425, "entropy": 0.28410500288009644, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:52.115011Z", "loop": 1216, "env_steps": 747724799, "loss": 0.00622998783364892, "avg_return": 0.42018452286720276, "regret": 0.3772609531879425, "entropy": 0.2939775586128235, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:53.275421Z", "loop": 1217, "env_steps": 748339199, "loss": 0.006838440895080566, "avg_return": 0.4252576529979706, "regret": 0.3772609531879425, "entropy": 0.28495052456855774, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:54.436135Z", "loop": 1218, "env_steps": 748953599, "loss": 0.006434580776840448, "avg_return": 0.42702072858810425, "regret": 0.3772609531879425, "entropy": 0.2861229181289673, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:55.596217Z", "loop": 1219, "env_steps": 749567999, "loss": 0.007078907918184996, "avg_return": 0.43228867650032043, "regret": 0.3772609531879425, "entropy": 0.2803218364715576, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:56.802546Z", "loop": 1220, "env_steps": 750182399, "loss": 0.0064360760152339935, "avg_return": 0.42479661107063293, "regret": 0.3751610815525055, "entropy": 0.29570940136909485, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:57.962261Z", "loop": 1221, "env_steps": 750796799, "loss": 0.006678110454231501, "avg_return": 0.4339146018028259, "regret": 0.3751610815525055, "entropy": 0.2879820168018341, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:49:59.122305Z", "loop": 1222, "env_steps": 751411199, "loss": 0.006069598253816366, "avg_return": 0.4307360351085663, "regret": 0.3751610815525055, "entropy": 0.28078970313072205, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:00.283538Z", "loop": 1223, "env_steps": 752025599, "loss": 0.005274869501590729, "avg_return": 0.41888558864593506, "regret": 0.3751610815525055, "entropy": 0.27307140827178955, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:01.443169Z", "loop": 1224, "env_steps": 752639999, "loss": 0.005803701933473349, "avg_return": 0.42187634110450745, "regret": 0.3751610815525055, "entropy": 0.2679528295993805, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:02.650812Z", "loop": 1225, "env_steps": 753254399, "loss": 0.004931487608700991, "avg_return": 0.416694700717926, "regret": 0.3816276788711548, "entropy": 0.27046820521354675, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:03.815474Z", "loop": 1226, "env_steps": 753868799, "loss": 0.005699932109564543, "avg_return": 0.42851945757865906, "regret": 0.3816276788711548, "entropy": 0.270464152097702, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:04.974186Z", "loop": 1227, "env_steps": 754483199, "loss": 0.006825435906648636, "avg_return": 0.4318121373653412, "regret": 0.3816276788711548, "entropy": 0.2843266725540161, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:06.133043Z", "loop": 1228, "env_steps": 755097599, "loss": 0.006065565627068281, "avg_return": 0.4321390986442566, "regret": 0.3816276788711548, "entropy": 0.2929428815841675, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:07.294657Z", "loop": 1229, "env_steps": 755711999, "loss": 0.006627535913139582, "avg_return": 0.43102937936782837, "regret": 0.3816276788711548, "entropy": 0.27793237566947937, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:08.500768Z", "loop": 1230, "env_steps": 756326399, "loss": 0.006861505564302206, "avg_return": 0.42847225069999695, "regret": 0.37617188692092896, "entropy": 0.2526931166648865, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:09.663453Z", "loop": 1231, "env_steps": 756940799, "loss": 0.006578243803232908, "avg_return": 0.42391547560691833, "regret": 0.37617188692092896, "entropy": 0.24620744585990906, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:10.823295Z", "loop": 1232, "env_steps": 757555199, "loss": 0.006653764750808477, "avg_return": 0.42570582032203674, "regret": 0.37617188692092896, "entropy": 0.24217680096626282, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:11.985095Z", "loop": 1233, "env_steps": 758169599, "loss": 0.0063951872289180756, "avg_return": 0.4193821847438812, "regret": 0.37617188692092896, "entropy": 0.23684197664260864, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:13.147959Z", "loop": 1234, "env_steps": 758783999, "loss": 0.007116851396858692, "avg_return": 0.42698681354522705, "regret": 0.37617188692092896, "entropy": 0.2526000440120697, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:14.353525Z", "loop": 1235, "env_steps": 759398399, "loss": 0.0065494440495967865, "avg_return": 0.43857693672180176, "regret": 0.3722515404224396, "entropy": 0.26819396018981934, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:15.512770Z", "loop": 1236, "env_steps": 760012799, "loss": 0.006187550723552704, "avg_return": 0.4310890734195709, "regret": 0.3722515404224396, "entropy": 0.2743307054042816, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:16.674556Z", "loop": 1237, "env_steps": 760627199, "loss": 0.005615950562059879, "avg_return": 0.43188315629959106, "regret": 0.3722515404224396, "entropy": 0.25382912158966064, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:17.835440Z", "loop": 1238, "env_steps": 761241599, "loss": 0.0046828496269881725, "avg_return": 0.4261488914489746, "regret": 0.3722515404224396, "entropy": 0.25851649045944214, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:18.995843Z", "loop": 1239, "env_steps": 761855999, "loss": 0.005253457929939032, "avg_return": 0.43296754360198975, "regret": 0.3722515404224396, "entropy": 0.246118426322937, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:20.202693Z", "loop": 1240, "env_steps": 762470399, "loss": 0.004950068425387144, "avg_return": 0.4282304346561432, "regret": 0.3748546540737152, "entropy": 0.2527126371860504, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:21.363529Z", "loop": 1241, "env_steps": 763084799, "loss": 0.005526195280253887, "avg_return": 0.43577954173088074, "regret": 0.3748546540737152, "entropy": 0.254287451505661, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:22.524065Z", "loop": 1242, "env_steps": 763699199, "loss": 0.005297968629747629, "avg_return": 0.4254453778266907, "regret": 0.3748546540737152, "entropy": 0.2553076446056366, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:23.684850Z", "loop": 1243, "env_steps": 764313599, "loss": 0.005091499537229538, "avg_return": 0.4299314022064209, "regret": 0.3748546540737152, "entropy": 0.2542456090450287, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:24.844661Z", "loop": 1244, "env_steps": 764927999, "loss": 0.00539373466745019, "avg_return": 0.4284574091434479, "regret": 0.3748546540737152, "entropy": 0.26410654187202454, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:26.050425Z", "loop": 1245, "env_steps": 765542399, "loss": 0.006561934947967529, "avg_return": 0.4409482479095459, "regret": 0.37077030539512634, "entropy": 0.2582109868526459, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:27.209276Z", "loop": 1246, "env_steps": 766156799, "loss": 0.006053637247532606, "avg_return": 0.43435975909233093, "regret": 0.37077030539512634, "entropy": 0.2656775712966919, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:28.368639Z", "loop": 1247, "env_steps": 766771199, "loss": 0.005742342676967382, "avg_return": 0.42851442098617554, "regret": 0.37077030539512634, "entropy": 0.2553432881832123, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:29.527396Z", "loop": 1248, "env_steps": 767385599, "loss": 0.006686076521873474, "avg_return": 0.4350176155567169, "regret": 0.37077030539512634, "entropy": 0.25591716170310974, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:30.686924Z", "loop": 1249, "env_steps": 767999999, "loss": 0.006095394026488066, "avg_return": 0.42832180857658386, "regret": 0.37077030539512634, "entropy": 0.2554043233394623, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:31.891904Z", "loop": 1250, "env_steps": 768614399, "loss": 0.00647351611405611, "avg_return": 0.42994406819343567, "regret": 0.3709425926208496, "entropy": 0.25277867913246155, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:33.052391Z", "loop": 1251, "env_steps": 769228799, "loss": 0.006231095641851425, "avg_return": 0.438798189163208, "regret": 0.3709425926208496, "entropy": 0.25066229701042175, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:34.212081Z", "loop": 1252, "env_steps": 769843199, "loss": 0.006225747521966696, "avg_return": 0.43512386083602905, "regret": 0.3709425926208496, "entropy": 0.2500191926956177, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:35.373422Z", "loop": 1253, "env_steps": 770457599, "loss": 0.006096676457673311, "avg_return": 0.43166911602020264, "regret": 0.3709425926208496, "entropy": 0.2536863088607788, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:36.533880Z", "loop": 1254, "env_steps": 771071999, "loss": 0.0061537581495940685, "avg_return": 0.4368791878223419, "regret": 0.3709425926208496, "entropy": 0.25638481974601746, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:37.739423Z", "loop": 1255, "env_steps": 771686399, "loss": 0.005356145557016134, "avg_return": 0.44065696001052856, "regret": 0.36976158618927, "entropy": 0.2577786147594452, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:38.898195Z", "loop": 1256, "env_steps": 772300799, "loss": 0.00556271942332387, "avg_return": 0.429556280374527, "regret": 0.36976158618927, "entropy": 0.253673255443573, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:40.058686Z", "loop": 1257, "env_steps": 772915199, "loss": 0.005228675901889801, "avg_return": 0.4325100779533386, "regret": 0.36976158618927, "entropy": 0.2541309595108032, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:41.218839Z", "loop": 1258, "env_steps": 773529599, "loss": 0.005520765203982592, "avg_return": 0.44063377380371094, "regret": 0.36976158618927, "entropy": 0.26230940222740173, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:42.378641Z", "loop": 1259, "env_steps": 774143999, "loss": 0.005881137680262327, "avg_return": 0.43420523405075073, "regret": 0.36976158618927, "entropy": 0.25771698355674744, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:43.588249Z", "loop": 1260, "env_steps": 774758399, "loss": 0.005764072295278311, "avg_return": 0.43902671337127686, "regret": 0.3695015013217926, "entropy": 0.25926074385643005, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:44.749540Z", "loop": 1261, "env_steps": 775372799, "loss": 0.0057675475254654884, "avg_return": 0.43342986702919006, "regret": 0.3695015013217926, "entropy": 0.2634729743003845, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:45.908301Z", "loop": 1262, "env_steps": 775987199, "loss": 0.00571587635204196, "avg_return": 0.4322837293148041, "regret": 0.3695015013217926, "entropy": 0.26511409878730774, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:47.067158Z", "loop": 1263, "env_steps": 776601599, "loss": 0.006383198779076338, "avg_return": 0.4391433298587799, "regret": 0.3695015013217926, "entropy": 0.2643567621707916, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:48.227117Z", "loop": 1264, "env_steps": 777215999, "loss": 0.005912675056606531, "avg_return": 0.4345117211341858, "regret": 0.3695015013217926, "entropy": 0.2579122483730316, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:49.432749Z", "loop": 1265, "env_steps": 777830399, "loss": 0.006207944825291634, "avg_return": 0.431088924407959, "regret": 0.3695605993270874, "entropy": 0.25751081109046936, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:50.592541Z", "loop": 1266, "env_steps": 778444799, "loss": 0.006245449651032686, "avg_return": 0.4358326196670532, "regret": 0.3695605993270874, "entropy": 0.25714582204818726, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:51.752311Z", "loop": 1267, "env_steps": 779059199, "loss": 0.006289210170507431, "avg_return": 0.4376056492328644, "regret": 0.3695605993270874, "entropy": 0.25101572275161743, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:52.911074Z", "loop": 1268, "env_steps": 779673599, "loss": 0.006353389471769333, "avg_return": 0.42976075410842896, "regret": 0.3695605993270874, "entropy": 0.2556461691856384, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:54.069971Z", "loop": 1269, "env_steps": 780287999, "loss": 0.006480608135461807, "avg_return": 0.42893850803375244, "regret": 0.3695605993270874, "entropy": 0.24207834899425507, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:55.277963Z", "loop": 1270, "env_steps": 780902399, "loss": 0.006561861839145422, "avg_return": 0.4290929138660431, "regret": 0.37603914737701416, "entropy": 0.2446601688861847, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:56.437837Z", "loop": 1271, "env_steps": 781516799, "loss": 0.006505223456770182, "avg_return": 0.42437124252319336, "regret": 0.37603914737701416, "entropy": 0.2422529011964798, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:57.597224Z", "loop": 1272, "env_steps": 782131199, "loss": 0.006149225868284702, "avg_return": 0.4196452796459198, "regret": 0.37603914737701416, "entropy": 0.23543035984039307, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:58.756161Z", "loop": 1273, "env_steps": 782745599, "loss": 0.006778208073228598, "avg_return": 0.4351763129234314, "regret": 0.37603914737701416, "entropy": 0.24621719121932983, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:50:59.916417Z", "loop": 1274, "env_steps": 783359999, "loss": 0.006272497121244669, "avg_return": 0.4380721151828766, "regret": 0.37603914737701416, "entropy": 0.25106504559516907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:01.122001Z", "loop": 1275, "env_steps": 783974399, "loss": 0.005609051324427128, "avg_return": 0.4409378170967102, "regret": 0.3680466413497925, "entropy": 0.2519344985485077, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:02.280829Z", "loop": 1276, "env_steps": 784588799, "loss": 0.004974246025085449, "avg_return": 0.43567201495170593, "regret": 0.3680466413497925, "entropy": 0.24576391279697418, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:03.440471Z", "loop": 1277, "env_steps": 785203199, "loss": 0.004629723262041807, "avg_return": 0.42251452803611755, "regret": 0.3680466413497925, "entropy": 0.23494572937488556, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:04.600868Z", "loop": 1278, "env_steps": 785817599, "loss": 0.004601528402417898, "avg_return": 0.42788249254226685, "regret": 0.3680466413497925, "entropy": 0.20775271952152252, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:05.760387Z", "loop": 1279, "env_steps": 786431999, "loss": 0.0036972523666918278, "avg_return": 0.42264291644096375, "regret": 0.3680466413497925, "entropy": 0.20679226517677307, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:06.967156Z", "loop": 1280, "env_steps": 787046399, "loss": 0.004053942393511534, "avg_return": 0.42558926343917847, "regret": 0.37724125385284424, "entropy": 0.20678094029426575, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:08.128292Z", "loop": 1281, "env_steps": 787660799, "loss": 0.0041489670984447, "avg_return": 0.43098700046539307, "regret": 0.37724125385284424, "entropy": 0.21075576543807983, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:09.288998Z", "loop": 1282, "env_steps": 788275199, "loss": 0.004637233447283506, "avg_return": 0.432824969291687, "regret": 0.37724125385284424, "entropy": 0.22495150566101074, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:10.448568Z", "loop": 1283, "env_steps": 788889599, "loss": 0.005272720009088516, "avg_return": 0.4373481273651123, "regret": 0.37724125385284424, "entropy": 0.2412644624710083, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:11.610084Z", "loop": 1284, "env_steps": 789503999, "loss": 0.005090819671750069, "avg_return": 0.4354051351547241, "regret": 0.37724125385284424, "entropy": 0.24619346857070923, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:12.817174Z", "loop": 1285, "env_steps": 790118399, "loss": 0.006093886680901051, "avg_return": 0.4387342929840088, "regret": 0.36730048060417175, "entropy": 0.24341736733913422, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:13.977109Z", "loop": 1286, "env_steps": 790732799, "loss": 0.0052945720963180065, "avg_return": 0.4298451840877533, "regret": 0.36730048060417175, "entropy": 0.23430870473384857, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:15.135976Z", "loop": 1287, "env_steps": 791347199, "loss": 0.006034533027559519, "avg_return": 0.43284064531326294, "regret": 0.36730048060417175, "entropy": 0.22918441891670227, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:16.298971Z", "loop": 1288, "env_steps": 791961599, "loss": 0.00573412049561739, "avg_return": 0.4291022717952728, "regret": 0.36730048060417175, "entropy": 0.2185962200164795, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:17.476185Z", "loop": 1289, "env_steps": 792575999, "loss": 0.005882136523723602, "avg_return": 0.4230870306491852, "regret": 0.36730048060417175, "entropy": 0.217995747923851, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:18.687702Z", "loop": 1290, "env_steps": 793190399, "loss": 0.006488848477602005, "avg_return": 0.42664939165115356, "regret": 0.38194841146469116, "entropy": 0.21271421015262604, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:19.849492Z", "loop": 1291, "env_steps": 793804799, "loss": 0.006693393923342228, "avg_return": 0.431623637676239, "regret": 0.38194841146469116, "entropy": 0.2145639955997467, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:21.009453Z", "loop": 1292, "env_steps": 794419199, "loss": 0.005732710938900709, "avg_return": 0.43844616413116455, "regret": 0.38194841146469116, "entropy": 0.21882401406764984, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:22.171109Z", "loop": 1293, "env_steps": 795033599, "loss": 0.0054931435734033585, "avg_return": 0.4414743185043335, "regret": 0.38194841146469116, "entropy": 0.23293910920619965, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:23.330999Z", "loop": 1294, "env_steps": 795647999, "loss": 0.004908848088234663, "avg_return": 0.4317392110824585, "regret": 0.38194841146469116, "entropy": 0.22095118463039398, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:24.546619Z", "loop": 1295, "env_steps": 796262399, "loss": 0.004113440401852131, "avg_return": 0.43522360920906067, "regret": 0.37382566928863525, "entropy": 0.20260319113731384, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:25.709819Z", "loop": 1296, "env_steps": 796876799, "loss": 0.0036895542871207, "avg_return": 0.4205833077430725, "regret": 0.37382566928863525, "entropy": 0.18804676830768585, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:26.870969Z", "loop": 1297, "env_steps": 797491199, "loss": 0.00453995680436492, "avg_return": 0.4087471067905426, "regret": 0.37382566928863525, "entropy": 0.18198131024837494, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:28.030262Z", "loop": 1298, "env_steps": 798105599, "loss": 0.004080280661582947, "avg_return": 0.4242212474346161, "regret": 0.37382566928863525, "entropy": 0.18068861961364746, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:29.189742Z", "loop": 1299, "env_steps": 798719999, "loss": 0.0034539145417511463, "avg_return": 0.42116594314575195, "regret": 0.37382566928863525, "entropy": 0.1936865597963333, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:30.398303Z", "loop": 1300, "env_steps": 799334399, "loss": 0.0040947627276182175, "avg_return": 0.43189531564712524, "regret": 0.3746383786201477, "entropy": 0.19919708371162415, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:31.559723Z", "loop": 1301, "env_steps": 799948799, "loss": 0.003880925942212343, "avg_return": 0.42644429206848145, "regret": 0.3746383786201477, "entropy": 0.2025316208600998, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:32.722524Z", "loop": 1302, "env_steps": 800563199, "loss": 0.004372712224721909, "avg_return": 0.4330413043498993, "regret": 0.3746383786201477, "entropy": 0.20533473789691925, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:33.887057Z", "loop": 1303, "env_steps": 801177599, "loss": 0.004294842015951872, "avg_return": 0.4398852586746216, "regret": 0.3746383786201477, "entropy": 0.2148604840040207, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:35.049358Z", "loop": 1304, "env_steps": 801791999, "loss": 0.004552563186734915, "avg_return": 0.433718740940094, "regret": 0.3746383786201477, "entropy": 0.22008934617042542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:36.259730Z", "loop": 1305, "env_steps": 802406399, "loss": 0.00529259629547596, "avg_return": 0.4426997900009155, "regret": 0.36733317375183105, "entropy": 0.22916196286678314, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:37.420790Z", "loop": 1306, "env_steps": 803020799, "loss": 0.0053350720554590225, "avg_return": 0.43189215660095215, "regret": 0.36733317375183105, "entropy": 0.2322104275226593, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:38.581362Z", "loop": 1307, "env_steps": 803635199, "loss": 0.005708326585590839, "avg_return": 0.4314894676208496, "regret": 0.36733317375183105, "entropy": 0.22163277864456177, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:39.742285Z", "loop": 1308, "env_steps": 804249599, "loss": 0.005518258083611727, "avg_return": 0.42824259400367737, "regret": 0.36733317375183105, "entropy": 0.218905508518219, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:40.903096Z", "loop": 1309, "env_steps": 804863999, "loss": 0.006218682508915663, "avg_return": 0.4403158128261566, "regret": 0.36733317375183105, "entropy": 0.22227072715759277, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:42.111982Z", "loop": 1310, "env_steps": 805478399, "loss": 0.006155186798423529, "avg_return": 0.43650686740875244, "regret": 0.3723727762699127, "entropy": 0.22545404732227325, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:43.272900Z", "loop": 1311, "env_steps": 806092799, "loss": 0.006090014241635799, "avg_return": 0.4357653856277466, "regret": 0.3723727762699127, "entropy": 0.21593783795833588, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:44.434291Z", "loop": 1312, "env_steps": 806707199, "loss": 0.006080049555748701, "avg_return": 0.4274076521396637, "regret": 0.3723727762699127, "entropy": 0.2170797735452652, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:45.594699Z", "loop": 1313, "env_steps": 807321599, "loss": 0.006420563440769911, "avg_return": 0.43634656071662903, "regret": 0.3723727762699127, "entropy": 0.2120315283536911, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:46.756303Z", "loop": 1314, "env_steps": 807935999, "loss": 0.005619135219603777, "avg_return": 0.4359486997127533, "regret": 0.3723727762699127, "entropy": 0.21838033199310303, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:47.974323Z", "loop": 1315, "env_steps": 808550399, "loss": 0.005755992140620947, "avg_return": 0.4474802315235138, "regret": 0.3671797513961792, "entropy": 0.21898052096366882, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:49.135195Z", "loop": 1316, "env_steps": 809164799, "loss": 0.005859383847564459, "avg_return": 0.43477246165275574, "regret": 0.3671797513961792, "entropy": 0.223084956407547, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:50.296583Z", "loop": 1317, "env_steps": 809779199, "loss": 0.005519702564924955, "avg_return": 0.43916893005371094, "regret": 0.3671797513961792, "entropy": 0.2169535756111145, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:51.456911Z", "loop": 1318, "env_steps": 810393599, "loss": 0.005624963901937008, "avg_return": 0.43381327390670776, "regret": 0.3671797513961792, "entropy": 0.22011494636535645, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:52.616670Z", "loop": 1319, "env_steps": 811007999, "loss": 0.005485163535922766, "avg_return": 0.44183868169784546, "regret": 0.3671797513961792, "entropy": 0.21326196193695068, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:53.823860Z", "loop": 1320, "env_steps": 811622399, "loss": 0.005845004227012396, "avg_return": 0.43288859724998474, "regret": 0.3656022548675537, "entropy": 0.22341039776802063, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:54.984019Z", "loop": 1321, "env_steps": 812236799, "loss": 0.0054930723272264, "avg_return": 0.4302005171775818, "regret": 0.3656022548675537, "entropy": 0.2301894873380661, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:56.143209Z", "loop": 1322, "env_steps": 812851199, "loss": 0.005375574808567762, "avg_return": 0.4483104944229126, "regret": 0.3656022548675537, "entropy": 0.229319229722023, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:57.304158Z", "loop": 1323, "env_steps": 813465599, "loss": 0.004953356925398111, "avg_return": 0.43989884853363037, "regret": 0.3656022548675537, "entropy": 0.22415566444396973, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:58.464152Z", "loop": 1324, "env_steps": 814079999, "loss": 0.004652961622923613, "avg_return": 0.43865129351615906, "regret": 0.3656022548675537, "entropy": 0.2237161099910736, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:51:59.681225Z", "loop": 1325, "env_steps": 814694399, "loss": 0.0042763324454426765, "avg_return": 0.4375719428062439, "regret": 0.3674814999103546, "entropy": 0.2150871753692627, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:00.843062Z", "loop": 1326, "env_steps": 815308799, "loss": 0.004401141777634621, "avg_return": 0.44068044424057007, "regret": 0.3674814999103546, "entropy": 0.20383982360363007, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:02.002900Z", "loop": 1327, "env_steps": 815923199, "loss": 0.004572515841573477, "avg_return": 0.4397816061973572, "regret": 0.3674814999103546, "entropy": 0.2100605070590973, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:03.162425Z", "loop": 1328, "env_steps": 816537599, "loss": 0.004424515180289745, "avg_return": 0.4357287287712097, "regret": 0.3674814999103546, "entropy": 0.20366448163986206, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:04.324633Z", "loop": 1329, "env_steps": 817151999, "loss": 0.004353194031864405, "avg_return": 0.4254362881183624, "regret": 0.3674814999103546, "entropy": 0.21614307165145874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:05.533295Z", "loop": 1330, "env_steps": 817766399, "loss": 0.004264875780791044, "avg_return": 0.439850777387619, "regret": 0.3667326867580414, "entropy": 0.21636298298835754, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:06.696590Z", "loop": 1331, "env_steps": 818380799, "loss": 0.004573470447212458, "avg_return": 0.4325786530971527, "regret": 0.3667326867580414, "entropy": 0.22131450474262238, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:07.857701Z", "loop": 1332, "env_steps": 818995199, "loss": 0.004558610264211893, "avg_return": 0.433891624212265, "regret": 0.3667326867580414, "entropy": 0.21870283782482147, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:09.017005Z", "loop": 1333, "env_steps": 819609599, "loss": 0.004758748691529036, "avg_return": 0.4409414231777191, "regret": 0.3667326867580414, "entropy": 0.2140824794769287, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:10.179780Z", "loop": 1334, "env_steps": 820223999, "loss": 0.004796733148396015, "avg_return": 0.44257456064224243, "regret": 0.3667326867580414, "entropy": 0.22095629572868347, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:11.390330Z", "loop": 1335, "env_steps": 820838399, "loss": 0.0052590519189834595, "avg_return": 0.4407306909561157, "regret": 0.36535876989364624, "entropy": 0.22174857556819916, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:12.557036Z", "loop": 1336, "env_steps": 821452799, "loss": 0.004760872106999159, "avg_return": 0.44074490666389465, "regret": 0.36535876989364624, "entropy": 0.2246330976486206, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:13.718149Z", "loop": 1337, "env_steps": 822067199, "loss": 0.004830364603549242, "avg_return": 0.4386749267578125, "regret": 0.36535876989364624, "entropy": 0.2309603989124298, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:14.879307Z", "loop": 1338, "env_steps": 822681599, "loss": 0.004869111813604832, "avg_return": 0.43092504143714905, "regret": 0.36535876989364624, "entropy": 0.2299971580505371, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:16.038862Z", "loop": 1339, "env_steps": 823295999, "loss": 0.005302962847054005, "avg_return": 0.4356074035167694, "regret": 0.36535876989364624, "entropy": 0.23038604855537415, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:17.243483Z", "loop": 1340, "env_steps": 823910399, "loss": 0.005444287788122892, "avg_return": 0.44035351276397705, "regret": 0.3646770715713501, "entropy": 0.22472642362117767, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:18.403770Z", "loop": 1341, "env_steps": 824524799, "loss": 0.004997079726308584, "avg_return": 0.443699449300766, "regret": 0.3646770715713501, "entropy": 0.22600805759429932, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:19.567973Z", "loop": 1342, "env_steps": 825139199, "loss": 0.005656655412167311, "avg_return": 0.4378853440284729, "regret": 0.3646770715713501, "entropy": 0.21699649095535278, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:20.735981Z", "loop": 1343, "env_steps": 825753599, "loss": 0.00503160897642374, "avg_return": 0.43453115224838257, "regret": 0.3646770715713501, "entropy": 0.21254855394363403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:21.897563Z", "loop": 1344, "env_steps": 826367999, "loss": 0.0048773931339383125, "avg_return": 0.42232850193977356, "regret": 0.3646770715713501, "entropy": 0.21165625751018524, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:23.110114Z", "loop": 1345, "env_steps": 826982399, "loss": 0.005779332481324673, "avg_return": 0.43678247928619385, "regret": 0.36745575070381165, "entropy": 0.20801794528961182, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:24.271175Z", "loop": 1346, "env_steps": 827596799, "loss": 0.005718022119253874, "avg_return": 0.43662238121032715, "regret": 0.36745575070381165, "entropy": 0.20676568150520325, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:25.433062Z", "loop": 1347, "env_steps": 828211199, "loss": 0.005069330800324678, "avg_return": 0.4301486313343048, "regret": 0.36745575070381165, "entropy": 0.20776884257793427, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:26.593869Z", "loop": 1348, "env_steps": 828825599, "loss": 0.005116210784763098, "avg_return": 0.44154563546180725, "regret": 0.36745575070381165, "entropy": 0.20454041659832, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:27.761652Z", "loop": 1349, "env_steps": 829439999, "loss": 0.004829623270779848, "avg_return": 0.434268057346344, "regret": 0.36745575070381165, "entropy": 0.2118213176727295, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:28.976378Z", "loop": 1350, "env_steps": 830054399, "loss": 0.005260223522782326, "avg_return": 0.4474910497665405, "regret": 0.36463379859924316, "entropy": 0.21452046930789948, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:30.138135Z", "loop": 1351, "env_steps": 830668799, "loss": 0.005197419784963131, "avg_return": 0.44269323348999023, "regret": 0.36463379859924316, "entropy": 0.21749809384346008, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:31.298859Z", "loop": 1352, "env_steps": 831283199, "loss": 0.005411254707723856, "avg_return": 0.43908071517944336, "regret": 0.36463379859924316, "entropy": 0.22017385065555573, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:32.458775Z", "loop": 1353, "env_steps": 831897599, "loss": 0.005272179376333952, "avg_return": 0.4308575689792633, "regret": 0.36463379859924316, "entropy": 0.22498534619808197, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:33.619292Z", "loop": 1354, "env_steps": 832511999, "loss": 0.0053978064097464085, "avg_return": 0.4476507306098938, "regret": 0.36463379859924316, "entropy": 0.23445232212543488, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:34.824151Z", "loop": 1355, "env_steps": 833126399, "loss": 0.004735259804874659, "avg_return": 0.4387122690677643, "regret": 0.36485737562179565, "entropy": 0.20920705795288086, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:35.986647Z", "loop": 1356, "env_steps": 833740799, "loss": 0.004063170403242111, "avg_return": 0.43384239077568054, "regret": 0.36485737562179565, "entropy": 0.19845089316368103, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:37.150499Z", "loop": 1357, "env_steps": 834355199, "loss": 0.004011859185993671, "avg_return": 0.43731844425201416, "regret": 0.36485737562179565, "entropy": 0.19301491975784302, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:38.314107Z", "loop": 1358, "env_steps": 834969599, "loss": 0.003580240998417139, "avg_return": 0.42308878898620605, "regret": 0.36485737562179565, "entropy": 0.1803005039691925, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:39.475409Z", "loop": 1359, "env_steps": 835583999, "loss": 0.0036275696475058794, "avg_return": 0.4269873797893524, "regret": 0.36485737562179565, "entropy": 0.17781414091587067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:40.694299Z", "loop": 1360, "env_steps": 836198399, "loss": 0.003994476981461048, "avg_return": 0.4251721203327179, "regret": 0.37326908111572266, "entropy": 0.17823049426078796, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:41.854504Z", "loop": 1361, "env_steps": 836812799, "loss": 0.004037619102746248, "avg_return": 0.42834681272506714, "regret": 0.37326908111572266, "entropy": 0.18280352652072906, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:43.014452Z", "loop": 1362, "env_steps": 837427199, "loss": 0.0036373180337250233, "avg_return": 0.43087074160575867, "regret": 0.37326908111572266, "entropy": 0.18928200006484985, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:44.175263Z", "loop": 1363, "env_steps": 838041599, "loss": 0.003858789801597595, "avg_return": 0.43893739581108093, "regret": 0.37326908111572266, "entropy": 0.19245795905590057, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:45.335155Z", "loop": 1364, "env_steps": 838655999, "loss": 0.004233811050653458, "avg_return": 0.44035208225250244, "regret": 0.37326908111572266, "entropy": 0.20458047091960907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:46.543754Z", "loop": 1365, "env_steps": 839270399, "loss": 0.004649559501558542, "avg_return": 0.4427453279495239, "regret": 0.36443594098091125, "entropy": 0.20478709042072296, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:47.705090Z", "loop": 1366, "env_steps": 839884799, "loss": 0.005071157123893499, "avg_return": 0.4327283799648285, "regret": 0.36443594098091125, "entropy": 0.21389780938625336, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:48.870073Z", "loop": 1367, "env_steps": 840499199, "loss": 0.004715830087661743, "avg_return": 0.44151702523231506, "regret": 0.36443594098091125, "entropy": 0.21293702721595764, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:50.033899Z", "loop": 1368, "env_steps": 841113599, "loss": 0.005225331988185644, "avg_return": 0.4427647590637207, "regret": 0.36443594098091125, "entropy": 0.22267675399780273, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:51.196258Z", "loop": 1369, "env_steps": 841727999, "loss": 0.00505467876791954, "avg_return": 0.4412391185760498, "regret": 0.36443594098091125, "entropy": 0.21697069704532623, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:52.409440Z", "loop": 1370, "env_steps": 842342399, "loss": 0.005179824773222208, "avg_return": 0.4362330734729767, "regret": 0.36319106817245483, "entropy": 0.21942654252052307, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:53.571666Z", "loop": 1371, "env_steps": 842956799, "loss": 0.005935911554843187, "avg_return": 0.4422738254070282, "regret": 0.36319106817245483, "entropy": 0.2149960845708847, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:54.731037Z", "loop": 1372, "env_steps": 843571199, "loss": 0.005242415238171816, "avg_return": 0.4431924521923065, "regret": 0.36319106817245483, "entropy": 0.2143658548593521, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:55.889738Z", "loop": 1373, "env_steps": 844185599, "loss": 0.004827061202377081, "avg_return": 0.44394227862358093, "regret": 0.36319106817245483, "entropy": 0.20987041294574738, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:57.049727Z", "loop": 1374, "env_steps": 844799999, "loss": 0.005241518374532461, "avg_return": 0.43515604734420776, "regret": 0.36319106817245483, "entropy": 0.21551543474197388, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:58.253525Z", "loop": 1375, "env_steps": 845414399, "loss": 0.005460223648697138, "avg_return": 0.4336957037448883, "regret": 0.36394837498664856, "entropy": 0.2140861451625824, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:52:59.412369Z", "loop": 1376, "env_steps": 846028799, "loss": 0.0054448386654257774, "avg_return": 0.44310319423675537, "regret": 0.36394837498664856, "entropy": 0.2180512398481369, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:00.573157Z", "loop": 1377, "env_steps": 846643199, "loss": 0.005421302746981382, "avg_return": 0.4338782727718353, "regret": 0.36394837498664856, "entropy": 0.21490946412086487, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:01.731848Z", "loop": 1378, "env_steps": 847257599, "loss": 0.004894033074378967, "avg_return": 0.43833670020103455, "regret": 0.36394837498664856, "entropy": 0.21644116938114166, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:02.890161Z", "loop": 1379, "env_steps": 847871999, "loss": 0.004559204913675785, "avg_return": 0.43598878383636475, "regret": 0.36394837498664856, "entropy": 0.21289965510368347, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:04.095140Z", "loop": 1380, "env_steps": 848486399, "loss": 0.005011027678847313, "avg_return": 0.43982017040252686, "regret": 0.36315974593162537, "entropy": 0.20854264497756958, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:05.256147Z", "loop": 1381, "env_steps": 849100799, "loss": 0.004869330674409866, "avg_return": 0.43811824917793274, "regret": 0.36315974593162537, "entropy": 0.20824258029460907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:06.415369Z", "loop": 1382, "env_steps": 849715199, "loss": 0.004517262801527977, "avg_return": 0.4513051509857178, "regret": 0.36315974593162537, "entropy": 0.19625315070152283, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:07.576881Z", "loop": 1383, "env_steps": 850329599, "loss": 0.004564834292978048, "avg_return": 0.4378693699836731, "regret": 0.36315974593162537, "entropy": 0.2007223218679428, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:08.739017Z", "loop": 1384, "env_steps": 850943999, "loss": 0.003801588434726, "avg_return": 0.4416171908378601, "regret": 0.36315974593162537, "entropy": 0.20135745406150818, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:09.947649Z", "loop": 1385, "env_steps": 851558399, "loss": 0.0042084516026079655, "avg_return": 0.44650599360466003, "regret": 0.36438947916030884, "entropy": 0.20120148360729218, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:11.112228Z", "loop": 1386, "env_steps": 852172799, "loss": 0.004308356903493404, "avg_return": 0.4420010447502136, "regret": 0.36438947916030884, "entropy": 0.20694448053836823, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:12.272751Z", "loop": 1387, "env_steps": 852787199, "loss": 0.004776172339916229, "avg_return": 0.4391080439090729, "regret": 0.36438947916030884, "entropy": 0.1967846006155014, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:13.436798Z", "loop": 1388, "env_steps": 853401599, "loss": 0.004503174684941769, "avg_return": 0.44444525241851807, "regret": 0.36438947916030884, "entropy": 0.20481304824352264, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:14.598442Z", "loop": 1389, "env_steps": 854015999, "loss": 0.004733038600534201, "avg_return": 0.430575966835022, "regret": 0.36438947916030884, "entropy": 0.2103794366121292, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:15.815382Z", "loop": 1390, "env_steps": 854630399, "loss": 0.004740732256323099, "avg_return": 0.44978705048561096, "regret": 0.3627799451351166, "entropy": 0.20074644684791565, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:16.979881Z", "loop": 1391, "env_steps": 855244799, "loss": 0.004879506770521402, "avg_return": 0.43895187973976135, "regret": 0.3627799451351166, "entropy": 0.18723632395267487, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:18.141244Z", "loop": 1392, "env_steps": 855859199, "loss": 0.005298759788274765, "avg_return": 0.45006927847862244, "regret": 0.3627799451351166, "entropy": 0.19558675587177277, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:19.304322Z", "loop": 1393, "env_steps": 856473599, "loss": 0.004794063046574593, "avg_return": 0.44252076745033264, "regret": 0.3627799451351166, "entropy": 0.1964181512594223, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:20.466081Z", "loop": 1394, "env_steps": 857087999, "loss": 0.005050964187830687, "avg_return": 0.44059571623802185, "regret": 0.3627799451351166, "entropy": 0.19829848408699036, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:21.672773Z", "loop": 1395, "env_steps": 857702399, "loss": 0.004743058234453201, "avg_return": 0.443744421005249, "regret": 0.36271795630455017, "entropy": 0.20393379032611847, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:22.833774Z", "loop": 1396, "env_steps": 858316799, "loss": 0.0046251616440713406, "avg_return": 0.4404221177101135, "regret": 0.36271795630455017, "entropy": 0.19465869665145874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:23.995787Z", "loop": 1397, "env_steps": 858931199, "loss": 0.004427443724125624, "avg_return": 0.4389978051185608, "regret": 0.36271795630455017, "entropy": 0.19748777151107788, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:25.155282Z", "loop": 1398, "env_steps": 859545599, "loss": 0.004612565506249666, "avg_return": 0.4417273998260498, "regret": 0.36271795630455017, "entropy": 0.19791248440742493, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:26.315163Z", "loop": 1399, "env_steps": 860159999, "loss": 0.003779124468564987, "avg_return": 0.4366967976093292, "regret": 0.36271795630455017, "entropy": 0.1912519484758377, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:27.520937Z", "loop": 1400, "env_steps": 860774399, "loss": 0.0037148860283195972, "avg_return": 0.4395681321620941, "regret": 0.3641980290412903, "entropy": 0.19068503379821777, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:28.681621Z", "loop": 1401, "env_steps": 861388799, "loss": 0.003890997264534235, "avg_return": 0.439691424369812, "regret": 0.3641980290412903, "entropy": 0.19514058530330658, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:29.841375Z", "loop": 1402, "env_steps": 862003199, "loss": 0.0035806179512292147, "avg_return": 0.44194352626800537, "regret": 0.3641980290412903, "entropy": 0.1904919296503067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:31.001035Z", "loop": 1403, "env_steps": 862617599, "loss": 0.003644993994385004, "avg_return": 0.4343768358230591, "regret": 0.3641980290412903, "entropy": 0.18915092945098877, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:32.160214Z", "loop": 1404, "env_steps": 863231999, "loss": 0.0034817587584257126, "avg_return": 0.4386554956436157, "regret": 0.3641980290412903, "entropy": 0.1815481334924698, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:33.370393Z", "loop": 1405, "env_steps": 863846399, "loss": 0.003449724754318595, "avg_return": 0.43562379479408264, "regret": 0.36635512113571167, "entropy": 0.1780463308095932, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:34.531991Z", "loop": 1406, "env_steps": 864460799, "loss": 0.0032318835146725178, "avg_return": 0.4389062523841858, "regret": 0.36635512113571167, "entropy": 0.1756194829940796, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:35.692125Z", "loop": 1407, "env_steps": 865075199, "loss": 0.0034257720690220594, "avg_return": 0.4383780062198639, "regret": 0.36635512113571167, "entropy": 0.17536026239395142, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:36.851459Z", "loop": 1408, "env_steps": 865689599, "loss": 0.0034019630402326584, "avg_return": 0.4369032382965088, "regret": 0.36635512113571167, "entropy": 0.17991745471954346, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:38.010918Z", "loop": 1409, "env_steps": 866303999, "loss": 0.0034109465777873993, "avg_return": 0.4369983971118927, "regret": 0.36635512113571167, "entropy": 0.18384963274002075, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:39.216559Z", "loop": 1410, "env_steps": 866918399, "loss": 0.0032704004552215338, "avg_return": 0.4401445984840393, "regret": 0.365620881319046, "entropy": 0.1799827367067337, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:40.379950Z", "loop": 1411, "env_steps": 867532799, "loss": 0.003673477564007044, "avg_return": 0.4357035458087921, "regret": 0.365620881319046, "entropy": 0.18833403289318085, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:41.539918Z", "loop": 1412, "env_steps": 868147199, "loss": 0.0037618421483784914, "avg_return": 0.43437352776527405, "regret": 0.365620881319046, "entropy": 0.19091403484344482, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:42.699517Z", "loop": 1413, "env_steps": 868761599, "loss": 0.0039756083860993385, "avg_return": 0.4471420347690582, "regret": 0.365620881319046, "entropy": 0.18767915666103363, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:43.860555Z", "loop": 1414, "env_steps": 869375999, "loss": 0.0042329216375947, "avg_return": 0.4471156895160675, "regret": 0.365620881319046, "entropy": 0.1972438246011734, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:45.070564Z", "loop": 1415, "env_steps": 869990399, "loss": 0.0042086029425263405, "avg_return": 0.4441118538379669, "regret": 0.3620392084121704, "entropy": 0.1996917724609375, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:46.229930Z", "loop": 1416, "env_steps": 870604799, "loss": 0.004395266063511372, "avg_return": 0.4513967037200928, "regret": 0.3620392084121704, "entropy": 0.20085042715072632, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:47.389720Z", "loop": 1417, "env_steps": 871219199, "loss": 0.004222255200147629, "avg_return": 0.4376719295978546, "regret": 0.3620392084121704, "entropy": 0.19683687388896942, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:48.549067Z", "loop": 1418, "env_steps": 871833599, "loss": 0.004516312386840582, "avg_return": 0.4444478452205658, "regret": 0.3620392084121704, "entropy": 0.20895081758499146, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:49.709357Z", "loop": 1419, "env_steps": 872447999, "loss": 0.004643568303436041, "avg_return": 0.43604716658592224, "regret": 0.3620392084121704, "entropy": 0.20481400191783905, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:50.917825Z", "loop": 1420, "env_steps": 873062399, "loss": 0.004547599237412214, "avg_return": 0.44009050726890564, "regret": 0.3611360490322113, "entropy": 0.20520249009132385, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:52.078153Z", "loop": 1421, "env_steps": 873676799, "loss": 0.004439928103238344, "avg_return": 0.4388371407985687, "regret": 0.3611360490322113, "entropy": 0.20192459225654602, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:53.237178Z", "loop": 1422, "env_steps": 874291199, "loss": 0.005051568616181612, "avg_return": 0.4376866817474365, "regret": 0.3611360490322113, "entropy": 0.2070109099149704, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:54.401357Z", "loop": 1423, "env_steps": 874905599, "loss": 0.004966448526829481, "avg_return": 0.4502074420452118, "regret": 0.3611360490322113, "entropy": 0.21903657913208008, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:55.562274Z", "loop": 1424, "env_steps": 875519999, "loss": 0.005293530877679586, "avg_return": 0.4355190098285675, "regret": 0.3611360490322113, "entropy": 0.21813733875751495, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:56.769320Z", "loop": 1425, "env_steps": 876134399, "loss": 0.005304283928126097, "avg_return": 0.445877343416214, "regret": 0.3616954982280731, "entropy": 0.2237829864025116, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:57.929851Z", "loop": 1426, "env_steps": 876748799, "loss": 0.00544100534170866, "avg_return": 0.4439397156238556, "regret": 0.3616954982280731, "entropy": 0.22051818668842316, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:53:59.089002Z", "loop": 1427, "env_steps": 877363199, "loss": 0.005182379856705666, "avg_return": 0.43832308053970337, "regret": 0.3616954982280731, "entropy": 0.21811172366142273, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:00.249556Z", "loop": 1428, "env_steps": 877977599, "loss": 0.005217782687395811, "avg_return": 0.4438949227333069, "regret": 0.3616954982280731, "entropy": 0.2095453441143036, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:01.408559Z", "loop": 1429, "env_steps": 878591999, "loss": 0.005141452420502901, "avg_return": 0.44431251287460327, "regret": 0.3616954982280731, "entropy": 0.2121134251356125, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:02.615022Z", "loop": 1430, "env_steps": 879206399, "loss": 0.004589933902025223, "avg_return": 0.44245824217796326, "regret": 0.3607780933380127, "entropy": 0.21629388630390167, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:03.773919Z", "loop": 1431, "env_steps": 879820799, "loss": 0.005075507797300816, "avg_return": 0.45041483640670776, "regret": 0.3607780933380127, "entropy": 0.21244022250175476, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:04.934193Z", "loop": 1432, "env_steps": 880435199, "loss": 0.004708117339760065, "avg_return": 0.44275960326194763, "regret": 0.3607780933380127, "entropy": 0.2104920595884323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:06.093365Z", "loop": 1433, "env_steps": 881049599, "loss": 0.004349001217633486, "avg_return": 0.44495657086372375, "regret": 0.3607780933380127, "entropy": 0.20441700518131256, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:07.252639Z", "loop": 1434, "env_steps": 881663999, "loss": 0.0042836954817175865, "avg_return": 0.44482260942459106, "regret": 0.3607780933380127, "entropy": 0.20267443358898163, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:08.458083Z", "loop": 1435, "env_steps": 882278399, "loss": 0.004946691449731588, "avg_return": 0.44719311594963074, "regret": 0.36061280965805054, "entropy": 0.20038698613643646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:09.618425Z", "loop": 1436, "env_steps": 882892799, "loss": 0.0051643638871610165, "avg_return": 0.4491015672683716, "regret": 0.36061280965805054, "entropy": 0.20732301473617554, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:10.777684Z", "loop": 1437, "env_steps": 883507199, "loss": 0.004467154387384653, "avg_return": 0.4467814266681671, "regret": 0.36061280965805054, "entropy": 0.20468105375766754, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:11.938005Z", "loop": 1438, "env_steps": 884121599, "loss": 0.004671136848628521, "avg_return": 0.4375533163547516, "regret": 0.36061280965805054, "entropy": 0.20987334847450256, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:13.097220Z", "loop": 1439, "env_steps": 884735999, "loss": 0.004751561675220728, "avg_return": 0.44727393984794617, "regret": 0.36061280965805054, "entropy": 0.20339414477348328, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:14.304106Z", "loop": 1440, "env_steps": 885350399, "loss": 0.004489370156079531, "avg_return": 0.44449886679649353, "regret": 0.36056238412857056, "entropy": 0.20318181812763214, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:15.464065Z", "loop": 1441, "env_steps": 885964799, "loss": 0.00465413136407733, "avg_return": 0.44221508502960205, "regret": 0.36056238412857056, "entropy": 0.20765534043312073, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:16.625979Z", "loop": 1442, "env_steps": 886579199, "loss": 0.004677757155150175, "avg_return": 0.4414989948272705, "regret": 0.36056238412857056, "entropy": 0.2094004899263382, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:17.786291Z", "loop": 1443, "env_steps": 887193599, "loss": 0.004688613582402468, "avg_return": 0.43742144107818604, "regret": 0.36056238412857056, "entropy": 0.20622074604034424, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:18.946508Z", "loop": 1444, "env_steps": 887807999, "loss": 0.0043313708156347275, "avg_return": 0.4443187713623047, "regret": 0.36056238412857056, "entropy": 0.19017700850963593, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:20.152211Z", "loop": 1445, "env_steps": 888422399, "loss": 0.004227758850902319, "avg_return": 0.44556087255477905, "regret": 0.3603065013885498, "entropy": 0.19643016159534454, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:21.311450Z", "loop": 1446, "env_steps": 889036799, "loss": 0.004098846111446619, "avg_return": 0.4431462585926056, "regret": 0.3603065013885498, "entropy": 0.19800347089767456, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:22.471371Z", "loop": 1447, "env_steps": 889651199, "loss": 0.004133951384574175, "avg_return": 0.44367554783821106, "regret": 0.3603065013885498, "entropy": 0.18703557550907135, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:23.630809Z", "loop": 1448, "env_steps": 890265599, "loss": 0.0034466315992176533, "avg_return": 0.4420105218887329, "regret": 0.3603065013885498, "entropy": 0.1807454228401184, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:24.789408Z", "loop": 1449, "env_steps": 890879999, "loss": 0.003916642162948847, "avg_return": 0.44294053316116333, "regret": 0.3603065013885498, "entropy": 0.17922453582286835, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:25.994810Z", "loop": 1450, "env_steps": 891494399, "loss": 0.0033668323885649443, "avg_return": 0.44043609499931335, "regret": 0.3620011508464813, "entropy": 0.177765890955925, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:27.158116Z", "loop": 1451, "env_steps": 892108799, "loss": 0.0035031908191740513, "avg_return": 0.440220445394516, "regret": 0.3620011508464813, "entropy": 0.17687977850437164, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:28.317387Z", "loop": 1452, "env_steps": 892723199, "loss": 0.003510622074827552, "avg_return": 0.4345739483833313, "regret": 0.3620011508464813, "entropy": 0.17756693065166473, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:29.475682Z", "loop": 1453, "env_steps": 893337599, "loss": 0.004313531797379255, "avg_return": 0.44644472002983093, "regret": 0.3620011508464813, "entropy": 0.18355052173137665, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:30.635297Z", "loop": 1454, "env_steps": 893951999, "loss": 0.004366887733340263, "avg_return": 0.44452059268951416, "regret": 0.3620011508464813, "entropy": 0.19508995115756989, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:31.844679Z", "loop": 1455, "env_steps": 894566399, "loss": 0.004447165876626968, "avg_return": 0.43828609585762024, "regret": 0.3600237965583801, "entropy": 0.19458557665348053, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:33.005853Z", "loop": 1456, "env_steps": 895180799, "loss": 0.004767765756696463, "avg_return": 0.4444689154624939, "regret": 0.3600237965583801, "entropy": 0.1940487176179886, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:34.164015Z", "loop": 1457, "env_steps": 895795199, "loss": 0.005301922559738159, "avg_return": 0.43715527653694153, "regret": 0.3600237965583801, "entropy": 0.2051645666360855, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:35.323478Z", "loop": 1458, "env_steps": 896409599, "loss": 0.005321827717125416, "avg_return": 0.44281521439552307, "regret": 0.3600237965583801, "entropy": 0.197050079703331, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:36.483107Z", "loop": 1459, "env_steps": 897023999, "loss": 0.004549695644527674, "avg_return": 0.43833619356155396, "regret": 0.3600237965583801, "entropy": 0.1983085423707962, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:37.687612Z", "loop": 1460, "env_steps": 897638399, "loss": 0.005137152504175901, "avg_return": 0.44152960181236267, "regret": 0.36029481887817383, "entropy": 0.19317974150180817, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:38.846141Z", "loop": 1461, "env_steps": 898252799, "loss": 0.0051309033297002316, "avg_return": 0.4400269687175751, "regret": 0.36029481887817383, "entropy": 0.19522619247436523, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:40.005649Z", "loop": 1462, "env_steps": 898867199, "loss": 0.005205430556088686, "avg_return": 0.4400298297405243, "regret": 0.36029481887817383, "entropy": 0.1981329321861267, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:41.164725Z", "loop": 1463, "env_steps": 899481599, "loss": 0.004613053519278765, "avg_return": 0.44014838337898254, "regret": 0.36029481887817383, "entropy": 0.20079006254673004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:42.324472Z", "loop": 1464, "env_steps": 900095999, "loss": 0.00426911935210228, "avg_return": 0.4384753406047821, "regret": 0.36029481887817383, "entropy": 0.19751352071762085, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:43.529130Z", "loop": 1465, "env_steps": 900710399, "loss": 0.004687828477472067, "avg_return": 0.45232194662094116, "regret": 0.3598150312900543, "entropy": 0.19640694558620453, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:44.689459Z", "loop": 1466, "env_steps": 901324799, "loss": 0.00525703327730298, "avg_return": 0.45061397552490234, "regret": 0.3598150312900543, "entropy": 0.19651395082473755, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:45.850094Z", "loop": 1467, "env_steps": 901939199, "loss": 0.005141823552548885, "avg_return": 0.4455498456954956, "regret": 0.3598150312900543, "entropy": 0.1855512410402298, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:47.010857Z", "loop": 1468, "env_steps": 902553599, "loss": 0.005083736963570118, "avg_return": 0.4440179467201233, "regret": 0.3598150312900543, "entropy": 0.19460266828536987, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:48.170843Z", "loop": 1469, "env_steps": 903167999, "loss": 0.005164166912436485, "avg_return": 0.44096243381500244, "regret": 0.3598150312900543, "entropy": 0.19200214743614197, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:49.376756Z", "loop": 1470, "env_steps": 903782399, "loss": 0.005216145422309637, "avg_return": 0.4400613605976105, "regret": 0.36230242252349854, "entropy": 0.1937594711780548, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:50.535580Z", "loop": 1471, "env_steps": 904396799, "loss": 0.005578651092946529, "avg_return": 0.4443913400173187, "regret": 0.36230242252349854, "entropy": 0.19603349268436432, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:51.694801Z", "loop": 1472, "env_steps": 905011199, "loss": 0.004668505396693945, "avg_return": 0.4484851658344269, "regret": 0.36230242252349854, "entropy": 0.19861610233783722, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:52.854218Z", "loop": 1473, "env_steps": 905625599, "loss": 0.004355014301836491, "avg_return": 0.4390147626399994, "regret": 0.36230242252349854, "entropy": 0.19549553096294403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:54.014262Z", "loop": 1474, "env_steps": 906239999, "loss": 0.004075794480741024, "avg_return": 0.45037299394607544, "regret": 0.36230242252349854, "entropy": 0.18843607604503632, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:55.220575Z", "loop": 1475, "env_steps": 906854399, "loss": 0.00407456187531352, "avg_return": 0.4479113817214966, "regret": 0.3594888746738434, "entropy": 0.19600312411785126, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:56.381523Z", "loop": 1476, "env_steps": 907468799, "loss": 0.004213511943817139, "avg_return": 0.4448818564414978, "regret": 0.3594888746738434, "entropy": 0.18612661957740784, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:57.540427Z", "loop": 1477, "env_steps": 908083199, "loss": 0.003953933250159025, "avg_return": 0.44777223467826843, "regret": 0.3594888746738434, "entropy": 0.18147124350070953, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:58.702301Z", "loop": 1478, "env_steps": 908697599, "loss": 0.004168559331446886, "avg_return": 0.4435274302959442, "regret": 0.3594888746738434, "entropy": 0.18469159305095673, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:54:59.860895Z", "loop": 1479, "env_steps": 909311999, "loss": 0.004021452274173498, "avg_return": 0.4389397203922272, "regret": 0.3594888746738434, "entropy": 0.17631550133228302, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:01.064835Z", "loop": 1480, "env_steps": 909926399, "loss": 0.004068033304065466, "avg_return": 0.4429904818534851, "regret": 0.3630339503288269, "entropy": 0.1671978086233139, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:02.223391Z", "loop": 1481, "env_steps": 910540799, "loss": 0.004403082188218832, "avg_return": 0.44122910499572754, "regret": 0.3630339503288269, "entropy": 0.17086917161941528, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:03.384826Z", "loop": 1482, "env_steps": 911155199, "loss": 0.004387499298900366, "avg_return": 0.43947267532348633, "regret": 0.3630339503288269, "entropy": 0.17513470351696014, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:04.545702Z", "loop": 1483, "env_steps": 911769599, "loss": 0.004395912401378155, "avg_return": 0.43623781204223633, "regret": 0.3630339503288269, "entropy": 0.16887691617012024, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:05.705074Z", "loop": 1484, "env_steps": 912383999, "loss": 0.0040095592848956585, "avg_return": 0.43843334913253784, "regret": 0.3630339503288269, "entropy": 0.17133492231369019, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:06.914077Z", "loop": 1485, "env_steps": 912998399, "loss": 0.004756835754960775, "avg_return": 0.45079731941223145, "regret": 0.3619844615459442, "entropy": 0.17563268542289734, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:08.076350Z", "loop": 1486, "env_steps": 913612799, "loss": 0.004271849524229765, "avg_return": 0.4460032284259796, "regret": 0.3619844615459442, "entropy": 0.18854132294654846, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:09.237664Z", "loop": 1487, "env_steps": 914227199, "loss": 0.004507758188992739, "avg_return": 0.4478234052658081, "regret": 0.3619844615459442, "entropy": 0.19505995512008667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:10.397137Z", "loop": 1488, "env_steps": 914841599, "loss": 0.004475335590541363, "avg_return": 0.4445722699165344, "regret": 0.3619844615459442, "entropy": 0.20017080008983612, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:11.557312Z", "loop": 1489, "env_steps": 915455999, "loss": 0.004414798226207495, "avg_return": 0.43992945551872253, "regret": 0.3619844615459442, "entropy": 0.20916017889976501, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:12.762387Z", "loop": 1490, "env_steps": 916070399, "loss": 0.004733213223516941, "avg_return": 0.4424963891506195, "regret": 0.36097320914268494, "entropy": 0.20771870017051697, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:13.922273Z", "loop": 1491, "env_steps": 916684799, "loss": 0.004892346914857626, "avg_return": 0.4406617283821106, "regret": 0.36097320914268494, "entropy": 0.2057330310344696, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:15.081371Z", "loop": 1492, "env_steps": 917299199, "loss": 0.004580290522426367, "avg_return": 0.4385230243206024, "regret": 0.36097320914268494, "entropy": 0.20448867976665497, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:16.241089Z", "loop": 1493, "env_steps": 917913599, "loss": 0.004671439528465271, "avg_return": 0.44465669989585876, "regret": 0.36097320914268494, "entropy": 0.20268256962299347, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:17.400115Z", "loop": 1494, "env_steps": 918527999, "loss": 0.004801867064088583, "avg_return": 0.44123002886772156, "regret": 0.36097320914268494, "entropy": 0.19834886491298676, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:18.605009Z", "loop": 1495, "env_steps": 919142399, "loss": 0.005223305430263281, "avg_return": 0.43752798438072205, "regret": 0.3666720986366272, "entropy": 0.19181738793849945, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:19.763899Z", "loop": 1496, "env_steps": 919756799, "loss": 0.005146516487002373, "avg_return": 0.43842795491218567, "regret": 0.3666720986366272, "entropy": 0.19457894563674927, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:20.923870Z", "loop": 1497, "env_steps": 920371199, "loss": 0.004964071791619062, "avg_return": 0.4346035420894623, "regret": 0.3666720986366272, "entropy": 0.1953795850276947, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:22.082817Z", "loop": 1498, "env_steps": 920985599, "loss": 0.004822209477424622, "avg_return": 0.44374462962150574, "regret": 0.3666720986366272, "entropy": 0.19002459943294525, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:23.243322Z", "loop": 1499, "env_steps": 921599999, "loss": 0.0047084977850317955, "avg_return": 0.4430258274078369, "regret": 0.3666720986366272, "entropy": 0.1897522658109665, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:24.448429Z", "loop": 1500, "env_steps": 922214399, "loss": 0.004816858563572168, "avg_return": 0.4431872069835663, "regret": 0.3603774905204773, "entropy": 0.19488655030727386, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:25.608558Z", "loop": 1501, "env_steps": 922828799, "loss": 0.004691697657108307, "avg_return": 0.4445923864841461, "regret": 0.3603774905204773, "entropy": 0.19183312356472015, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:26.767306Z", "loop": 1502, "env_steps": 923443199, "loss": 0.0038605888839811087, "avg_return": 0.44494420289993286, "regret": 0.3603774905204773, "entropy": 0.17918746173381805, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:27.927112Z", "loop": 1503, "env_steps": 924057599, "loss": 0.0036333517637103796, "avg_return": 0.44126027822494507, "regret": 0.3603774905204773, "entropy": 0.17540611326694489, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:29.085930Z", "loop": 1504, "env_steps": 924671999, "loss": 0.0032293375115841627, "avg_return": 0.4367119073867798, "regret": 0.3603774905204773, "entropy": 0.16737885773181915, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:30.290947Z", "loop": 1505, "env_steps": 925286399, "loss": 0.003429112257435918, "avg_return": 0.4483996629714966, "regret": 0.3600212633609772, "entropy": 0.15893712639808655, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:31.450671Z", "loop": 1506, "env_steps": 925900799, "loss": 0.0030215426813811064, "avg_return": 0.45270559191703796, "regret": 0.3600212633609772, "entropy": 0.16071215271949768, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:32.611558Z", "loop": 1507, "env_steps": 926515199, "loss": 0.0033182245679199696, "avg_return": 0.4390551447868347, "regret": 0.3600212633609772, "entropy": 0.15954536199569702, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:33.770336Z", "loop": 1508, "env_steps": 927129599, "loss": 0.003156050341203809, "avg_return": 0.44225576519966125, "regret": 0.3600212633609772, "entropy": 0.15160326659679413, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:34.931167Z", "loop": 1509, "env_steps": 927743999, "loss": 0.0030563361942768097, "avg_return": 0.4403461813926697, "regret": 0.3600212633609772, "entropy": 0.15566222369670868, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:36.136012Z", "loop": 1510, "env_steps": 928358399, "loss": 0.0031779264099895954, "avg_return": 0.44215789437294006, "regret": 0.363309383392334, "entropy": 0.1525285542011261, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:37.296063Z", "loop": 1511, "env_steps": 928972799, "loss": 0.003107766853645444, "avg_return": 0.4394613802433014, "regret": 0.363309383392334, "entropy": 0.15862923860549927, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:38.455071Z", "loop": 1512, "env_steps": 929587199, "loss": 0.003363795345649123, "avg_return": 0.43635284900665283, "regret": 0.363309383392334, "entropy": 0.15349899232387543, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:39.615449Z", "loop": 1513, "env_steps": 930201599, "loss": 0.003137820167466998, "avg_return": 0.43762603402137756, "regret": 0.363309383392334, "entropy": 0.15236587822437286, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:40.774392Z", "loop": 1514, "env_steps": 930815999, "loss": 0.003102106275036931, "avg_return": 0.4476690888404846, "regret": 0.363309383392334, "entropy": 0.1483953893184662, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:41.979023Z", "loop": 1515, "env_steps": 931430399, "loss": 0.002911401679739356, "avg_return": 0.44029200077056885, "regret": 0.36190226674079895, "entropy": 0.15079298615455627, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:43.139034Z", "loop": 1516, "env_steps": 932044799, "loss": 0.0029691122472286224, "avg_return": 0.4462065100669861, "regret": 0.36190226674079895, "entropy": 0.1505342572927475, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:44.299014Z", "loop": 1517, "env_steps": 932659199, "loss": 0.0032503369729965925, "avg_return": 0.44575464725494385, "regret": 0.36190226674079895, "entropy": 0.1539245992898941, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:45.458528Z", "loop": 1518, "env_steps": 933273599, "loss": 0.002994375303387642, "avg_return": 0.44976162910461426, "regret": 0.36190226674079895, "entropy": 0.16145046055316925, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:46.621182Z", "loop": 1519, "env_steps": 933887999, "loss": 0.0038798365276306868, "avg_return": 0.44390803575515747, "regret": 0.36190226674079895, "entropy": 0.16242733597755432, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:47.825582Z", "loop": 1520, "env_steps": 934502399, "loss": 0.0039051093626767397, "avg_return": 0.4438919723033905, "regret": 0.35872140526771545, "entropy": 0.16493645310401917, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:48.985519Z", "loop": 1521, "env_steps": 935116799, "loss": 0.0036589596420526505, "avg_return": 0.44489309191703796, "regret": 0.35872140526771545, "entropy": 0.1717897653579712, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:50.149447Z", "loop": 1522, "env_steps": 935731199, "loss": 0.00437177624553442, "avg_return": 0.44736960530281067, "regret": 0.35872140526771545, "entropy": 0.17638856172561646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:51.309719Z", "loop": 1523, "env_steps": 936345599, "loss": 0.004056223668158054, "avg_return": 0.44546225666999817, "regret": 0.35872140526771545, "entropy": 0.17780117690563202, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:52.469354Z", "loop": 1524, "env_steps": 936959999, "loss": 0.0039036681409925222, "avg_return": 0.4413069188594818, "regret": 0.35872140526771545, "entropy": 0.1726495921611786, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:53.677041Z", "loop": 1525, "env_steps": 937574399, "loss": 0.0046795136295259, "avg_return": 0.44916418194770813, "regret": 0.36002832651138306, "entropy": 0.17186512053012848, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:54.835783Z", "loop": 1526, "env_steps": 938188799, "loss": 0.00474720960482955, "avg_return": 0.4480539560317993, "regret": 0.36002832651138306, "entropy": 0.17079193890094757, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:55.996734Z", "loop": 1527, "env_steps": 938803199, "loss": 0.004714425187557936, "avg_return": 0.4450945258140564, "regret": 0.36002832651138306, "entropy": 0.1762848198413849, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:57.156365Z", "loop": 1528, "env_steps": 939417599, "loss": 0.004531648010015488, "avg_return": 0.43630239367485046, "regret": 0.36002832651138306, "entropy": 0.18002448976039886, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:58.315832Z", "loop": 1529, "env_steps": 940031999, "loss": 0.0045555587857961655, "avg_return": 0.4410991668701172, "regret": 0.36002832651138306, "entropy": 0.18486423790454865, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:55:59.520840Z", "loop": 1530, "env_steps": 940646399, "loss": 0.004018268082290888, "avg_return": 0.4472789764404297, "regret": 0.35868796706199646, "entropy": 0.17293177545070648, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:00.681160Z", "loop": 1531, "env_steps": 941260799, "loss": 0.003935064654797316, "avg_return": 0.4426565170288086, "regret": 0.35868796706199646, "entropy": 0.1706131398677826, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:01.840107Z", "loop": 1532, "env_steps": 941875199, "loss": 0.0036356039345264435, "avg_return": 0.4504113793373108, "regret": 0.35868796706199646, "entropy": 0.16516105830669403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:02.999582Z", "loop": 1533, "env_steps": 942489599, "loss": 0.003680712776258588, "avg_return": 0.4432724714279175, "regret": 0.35868796706199646, "entropy": 0.16948378086090088, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:04.158383Z", "loop": 1534, "env_steps": 943103999, "loss": 0.0035628408659249544, "avg_return": 0.450653076171875, "regret": 0.35868796706199646, "entropy": 0.17119179666042328, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:05.363972Z", "loop": 1535, "env_steps": 943718399, "loss": 0.0035274624824523926, "avg_return": 0.45059359073638916, "regret": 0.3587278127670288, "entropy": 0.15973368287086487, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:06.524765Z", "loop": 1536, "env_steps": 944332799, "loss": 0.003321949392557144, "avg_return": 0.45234715938568115, "regret": 0.3587278127670288, "entropy": 0.15867936611175537, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:07.685321Z", "loop": 1537, "env_steps": 944947199, "loss": 0.0032140107359737158, "avg_return": 0.4479929208755493, "regret": 0.3587278127670288, "entropy": 0.1535572111606598, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:08.843313Z", "loop": 1538, "env_steps": 945561599, "loss": 0.0030360075179487467, "avg_return": 0.44293212890625, "regret": 0.3587278127670288, "entropy": 0.1481866091489792, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:10.002344Z", "loop": 1539, "env_steps": 946175999, "loss": 0.003151204902678728, "avg_return": 0.4454423189163208, "regret": 0.3587278127670288, "entropy": 0.14790555834770203, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:11.205451Z", "loop": 1540, "env_steps": 946790399, "loss": 0.0033726077526807785, "avg_return": 0.44061365723609924, "regret": 0.36245933175086975, "entropy": 0.148819237947464, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:12.366307Z", "loop": 1541, "env_steps": 947404799, "loss": 0.003468823852017522, "avg_return": 0.4421801269054413, "regret": 0.36245933175086975, "entropy": 0.1571406126022339, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:13.525459Z", "loop": 1542, "env_steps": 948019199, "loss": 0.0036214578431099653, "avg_return": 0.43864086270332336, "regret": 0.36245933175086975, "entropy": 0.151298388838768, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:14.684782Z", "loop": 1543, "env_steps": 948633599, "loss": 0.0038332745898514986, "avg_return": 0.4366065561771393, "regret": 0.36245933175086975, "entropy": 0.15217889845371246, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:15.843141Z", "loop": 1544, "env_steps": 949247999, "loss": 0.0037617485504597425, "avg_return": 0.4402672350406647, "regret": 0.36245933175086975, "entropy": 0.1515568494796753, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:17.045890Z", "loop": 1545, "env_steps": 949862399, "loss": 0.0033024100121110678, "avg_return": 0.4321846663951874, "regret": 0.3665902018547058, "entropy": 0.15009616315364838, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:18.205373Z", "loop": 1546, "env_steps": 950476799, "loss": 0.0033993662800639868, "avg_return": 0.432596355676651, "regret": 0.3665902018547058, "entropy": 0.1440104991197586, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:19.365885Z", "loop": 1547, "env_steps": 951091199, "loss": 0.0036377261858433485, "avg_return": 0.441107839345932, "regret": 0.3665902018547058, "entropy": 0.14999155700206757, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:20.524584Z", "loop": 1548, "env_steps": 951705599, "loss": 0.0035550480242818594, "avg_return": 0.43457815051078796, "regret": 0.3665902018547058, "entropy": 0.14837691187858582, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:21.684214Z", "loop": 1549, "env_steps": 952319999, "loss": 0.0035285805352032185, "avg_return": 0.4453352093696594, "regret": 0.3665902018547058, "entropy": 0.1558787226676941, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:22.888075Z", "loop": 1550, "env_steps": 952934399, "loss": 0.0036134112160652876, "avg_return": 0.4415495991706848, "regret": 0.3602672219276428, "entropy": 0.1608380377292633, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:24.051286Z", "loop": 1551, "env_steps": 953548799, "loss": 0.0032364351209253073, "avg_return": 0.44474300742149353, "regret": 0.3602672219276428, "entropy": 0.15020500123500824, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:25.210447Z", "loop": 1552, "env_steps": 954163199, "loss": 0.0031264224089682102, "avg_return": 0.4397086799144745, "regret": 0.3602672219276428, "entropy": 0.15932735800743103, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:26.369272Z", "loop": 1553, "env_steps": 954777599, "loss": 0.0035634320229291916, "avg_return": 0.4463999569416046, "regret": 0.3602672219276428, "entropy": 0.1648445576429367, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:27.529074Z", "loop": 1554, "env_steps": 955391999, "loss": 0.004041220527142286, "avg_return": 0.4482490122318268, "regret": 0.3602672219276428, "entropy": 0.17543749511241913, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:28.737918Z", "loop": 1555, "env_steps": 956006399, "loss": 0.003995911683887243, "avg_return": 0.4467785656452179, "regret": 0.35806024074554443, "entropy": 0.18779705464839935, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:29.899811Z", "loop": 1556, "env_steps": 956620799, "loss": 0.003931458108127117, "avg_return": 0.4434731602668762, "regret": 0.35806024074554443, "entropy": 0.17676237225532532, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:31.059765Z", "loop": 1557, "env_steps": 957235199, "loss": 0.004189594648778439, "avg_return": 0.4412347078323364, "regret": 0.35806024074554443, "entropy": 0.1878870129585266, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:32.218606Z", "loop": 1558, "env_steps": 957849599, "loss": 0.004175473004579544, "avg_return": 0.4383302927017212, "regret": 0.35806024074554443, "entropy": 0.1823156774044037, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:33.379328Z", "loop": 1559, "env_steps": 958463999, "loss": 0.004243189003318548, "avg_return": 0.4399392902851105, "regret": 0.35806024074554443, "entropy": 0.1833457052707672, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:34.586639Z", "loop": 1560, "env_steps": 959078399, "loss": 0.004151587374508381, "avg_return": 0.43754833936691284, "regret": 0.3616524338722229, "entropy": 0.18938812613487244, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:35.747563Z", "loop": 1561, "env_steps": 959692799, "loss": 0.003943211864680052, "avg_return": 0.4355815351009369, "regret": 0.3616524338722229, "entropy": 0.18123140931129456, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:36.907120Z", "loop": 1562, "env_steps": 960307199, "loss": 0.004296738188713789, "avg_return": 0.4420221447944641, "regret": 0.3616524338722229, "entropy": 0.18056072294712067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:38.068357Z", "loop": 1563, "env_steps": 960921599, "loss": 0.0043970500119030476, "avg_return": 0.44399526715278625, "regret": 0.3616524338722229, "entropy": 0.1825219988822937, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:39.229505Z", "loop": 1564, "env_steps": 961535999, "loss": 0.004171903245151043, "avg_return": 0.4351494312286377, "regret": 0.3616524338722229, "entropy": 0.18391937017440796, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:40.435298Z", "loop": 1565, "env_steps": 962150399, "loss": 0.004393117036670446, "avg_return": 0.44740748405456543, "regret": 0.3592347800731659, "entropy": 0.18513737618923187, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:41.595267Z", "loop": 1566, "env_steps": 962764799, "loss": 0.0040539843030273914, "avg_return": 0.44020652770996094, "regret": 0.3592347800731659, "entropy": 0.19054469466209412, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:42.755993Z", "loop": 1567, "env_steps": 963379199, "loss": 0.0040307133458554745, "avg_return": 0.4487994611263275, "regret": 0.3592347800731659, "entropy": 0.1768878996372223, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:43.917685Z", "loop": 1568, "env_steps": 963993599, "loss": 0.0038558233063668013, "avg_return": 0.44183728098869324, "regret": 0.3592347800731659, "entropy": 0.17714889347553253, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:45.083441Z", "loop": 1569, "env_steps": 964607999, "loss": 0.0037011594977229834, "avg_return": 0.44033151865005493, "regret": 0.3592347800731659, "entropy": 0.17377415299415588, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:46.291061Z", "loop": 1570, "env_steps": 965222399, "loss": 0.0033118475694209337, "avg_return": 0.4516853988170624, "regret": 0.3579496741294861, "entropy": 0.16407497227191925, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:47.450504Z", "loop": 1571, "env_steps": 965836799, "loss": 0.0031499837059527636, "avg_return": 0.4458600878715515, "regret": 0.3579496741294861, "entropy": 0.17173555493354797, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:48.610836Z", "loop": 1572, "env_steps": 966451199, "loss": 0.0033306588884443045, "avg_return": 0.4449584186077118, "regret": 0.3579496741294861, "entropy": 0.15939366817474365, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:49.771161Z", "loop": 1573, "env_steps": 967065599, "loss": 0.0036145285703241825, "avg_return": 0.44147664308547974, "regret": 0.3579496741294861, "entropy": 0.15722313523292542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:50.932098Z", "loop": 1574, "env_steps": 967679999, "loss": 0.003471003146842122, "avg_return": 0.4418540596961975, "regret": 0.3579496741294861, "entropy": 0.16310866177082062, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:52.136991Z", "loop": 1575, "env_steps": 968294399, "loss": 0.003817850025370717, "avg_return": 0.4482489228248596, "regret": 0.3592352271080017, "entropy": 0.1640133261680603, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:53.299215Z", "loop": 1576, "env_steps": 968908799, "loss": 0.0036058095283806324, "avg_return": 0.44722646474838257, "regret": 0.3592352271080017, "entropy": 0.16194987297058105, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:54.460324Z", "loop": 1577, "env_steps": 969523199, "loss": 0.003277732525020838, "avg_return": 0.4481866955757141, "regret": 0.3592352271080017, "entropy": 0.1624557375907898, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:55.622507Z", "loop": 1578, "env_steps": 970137599, "loss": 0.0034152206499129534, "avg_return": 0.4398307502269745, "regret": 0.3592352271080017, "entropy": 0.1617657095193863, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:56.789273Z", "loop": 1579, "env_steps": 970751999, "loss": 0.002879678038880229, "avg_return": 0.4463554918766022, "regret": 0.3592352271080017, "entropy": 0.1558510810136795, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:58.002337Z", "loop": 1580, "env_steps": 971366399, "loss": 0.003397309919819236, "avg_return": 0.44606831669807434, "regret": 0.35766348242759705, "entropy": 0.15692105889320374, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:56:59.171004Z", "loop": 1581, "env_steps": 971980799, "loss": 0.0032890464644879103, "avg_return": 0.4472337067127228, "regret": 0.35766348242759705, "entropy": 0.16307714581489563, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:00.329893Z", "loop": 1582, "env_steps": 972595199, "loss": 0.0035299554001539946, "avg_return": 0.4472246468067169, "regret": 0.35766348242759705, "entropy": 0.16003558039665222, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:01.490035Z", "loop": 1583, "env_steps": 973209599, "loss": 0.0034405626356601715, "avg_return": 0.44970306754112244, "regret": 0.35766348242759705, "entropy": 0.1631453037261963, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:02.649299Z", "loop": 1584, "env_steps": 973823999, "loss": 0.003492998657748103, "avg_return": 0.44973236322402954, "regret": 0.35766348242759705, "entropy": 0.16136710345745087, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:03.855082Z", "loop": 1585, "env_steps": 974438399, "loss": 0.003273200010880828, "avg_return": 0.44291922450065613, "regret": 0.35750579833984375, "entropy": 0.16060547530651093, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:05.019610Z", "loop": 1586, "env_steps": 975052799, "loss": 0.0034577397163957357, "avg_return": 0.44714102149009705, "regret": 0.35750579833984375, "entropy": 0.1608985960483551, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:06.182551Z", "loop": 1587, "env_steps": 975667199, "loss": 0.0034244402777403593, "avg_return": 0.44190266728401184, "regret": 0.35750579833984375, "entropy": 0.1529662013053894, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:07.343190Z", "loop": 1588, "env_steps": 976281599, "loss": 0.0032163397409021854, "avg_return": 0.4544552266597748, "regret": 0.35750579833984375, "entropy": 0.16109749674797058, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:08.504354Z", "loop": 1589, "env_steps": 976895999, "loss": 0.0037914738059043884, "avg_return": 0.44846493005752563, "regret": 0.35750579833984375, "entropy": 0.16665589809417725, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:09.710670Z", "loop": 1590, "env_steps": 977510399, "loss": 0.0043239593505859375, "avg_return": 0.450632244348526, "regret": 0.3575083911418915, "entropy": 0.17072491347789764, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:10.871352Z", "loop": 1591, "env_steps": 978124799, "loss": 0.004077370744198561, "avg_return": 0.451741099357605, "regret": 0.3575083911418915, "entropy": 0.16789433360099792, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:12.030481Z", "loop": 1592, "env_steps": 978739199, "loss": 0.0039059051778167486, "avg_return": 0.4524783492088318, "regret": 0.3575083911418915, "entropy": 0.16438955068588257, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:13.190907Z", "loop": 1593, "env_steps": 979353599, "loss": 0.0034432930406183004, "avg_return": 0.4449281394481659, "regret": 0.3575083911418915, "entropy": 0.16738790273666382, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:14.350205Z", "loop": 1594, "env_steps": 979967999, "loss": 0.003663117764517665, "avg_return": 0.4413531720638275, "regret": 0.3575083911418915, "entropy": 0.1688096821308136, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:15.554330Z", "loop": 1595, "env_steps": 980582399, "loss": 0.003925762604922056, "avg_return": 0.44477325677871704, "regret": 0.3573484718799591, "entropy": 0.16966935992240906, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:16.714452Z", "loop": 1596, "env_steps": 981196799, "loss": 0.0034796111285686493, "avg_return": 0.44610992074012756, "regret": 0.3573484718799591, "entropy": 0.16667062044143677, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:17.879373Z", "loop": 1597, "env_steps": 981811199, "loss": 0.003763379994779825, "avg_return": 0.4432818293571472, "regret": 0.3573484718799591, "entropy": 0.16224436461925507, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:19.041315Z", "loop": 1598, "env_steps": 982425599, "loss": 0.003670609788969159, "avg_return": 0.44890260696411133, "regret": 0.3573484718799591, "entropy": 0.16529212892055511, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:20.201702Z", "loop": 1599, "env_steps": 983039999, "loss": 0.0038636724930256605, "avg_return": 0.4471510052680969, "regret": 0.3573484718799591, "entropy": 0.16441549360752106, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:21.409350Z", "loop": 1600, "env_steps": 983654399, "loss": 0.0037411977536976337, "avg_return": 0.44562938809394836, "regret": 0.357310950756073, "entropy": 0.1705268770456314, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:22.570369Z", "loop": 1601, "env_steps": 984268799, "loss": 0.003973182290792465, "avg_return": 0.44892996549606323, "regret": 0.357310950756073, "entropy": 0.16586953401565552, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:23.729315Z", "loop": 1602, "env_steps": 984883199, "loss": 0.004306397866457701, "avg_return": 0.4433775842189789, "regret": 0.357310950756073, "entropy": 0.17091961205005646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:24.888707Z", "loop": 1603, "env_steps": 985497599, "loss": 0.0036936518736183643, "avg_return": 0.44814997911453247, "regret": 0.357310950756073, "entropy": 0.17262189090251923, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:26.048839Z", "loop": 1604, "env_steps": 986111999, "loss": 0.004709139931946993, "avg_return": 0.4468960762023926, "regret": 0.357310950756073, "entropy": 0.1594567745923996, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:27.251778Z", "loop": 1605, "env_steps": 986726399, "loss": 0.004267171025276184, "avg_return": 0.4438891112804413, "regret": 0.3603118360042572, "entropy": 0.15478894114494324, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:28.412030Z", "loop": 1606, "env_steps": 987340799, "loss": 0.004636743105947971, "avg_return": 0.44150713086128235, "regret": 0.3603118360042572, "entropy": 0.15659199655056, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:29.572594Z", "loop": 1607, "env_steps": 987955199, "loss": 0.004549603909254074, "avg_return": 0.44154807925224304, "regret": 0.3603118360042572, "entropy": 0.156270831823349, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:30.737119Z", "loop": 1608, "env_steps": 988569599, "loss": 0.004614512901753187, "avg_return": 0.4453880488872528, "regret": 0.3603118360042572, "entropy": 0.15611876547336578, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:31.895724Z", "loop": 1609, "env_steps": 989183999, "loss": 0.004158707335591316, "avg_return": 0.4439311921596527, "regret": 0.3603118360042572, "entropy": 0.15943235158920288, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:33.098861Z", "loop": 1610, "env_steps": 989798399, "loss": 0.004385951440781355, "avg_return": 0.43889710307121277, "regret": 0.35918718576431274, "entropy": 0.15568317472934723, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:34.258396Z", "loop": 1611, "env_steps": 990412799, "loss": 0.004018415231257677, "avg_return": 0.445500910282135, "regret": 0.35918718576431274, "entropy": 0.1601613461971283, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:35.419354Z", "loop": 1612, "env_steps": 991027199, "loss": 0.00400911970064044, "avg_return": 0.444467693567276, "regret": 0.35918718576431274, "entropy": 0.159645214676857, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:36.578391Z", "loop": 1613, "env_steps": 991641599, "loss": 0.0038319285959005356, "avg_return": 0.4452914595603943, "regret": 0.35918718576431274, "entropy": 0.16107289493083954, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:37.738701Z", "loop": 1614, "env_steps": 992255999, "loss": 0.003052422543987632, "avg_return": 0.44215598702430725, "regret": 0.35918718576431274, "entropy": 0.15119203925132751, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:38.941795Z", "loop": 1615, "env_steps": 992870399, "loss": 0.0028793474193662405, "avg_return": 0.4520087242126465, "regret": 0.35832616686820984, "entropy": 0.14312711358070374, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:40.102210Z", "loop": 1616, "env_steps": 993484799, "loss": 0.0025364418979734182, "avg_return": 0.44005289673805237, "regret": 0.35832616686820984, "entropy": 0.13285721838474274, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:41.261643Z", "loop": 1617, "env_steps": 994099199, "loss": 0.0021440715063363314, "avg_return": 0.4409410059452057, "regret": 0.35832616686820984, "entropy": 0.1311904639005661, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:42.421985Z", "loop": 1618, "env_steps": 994713599, "loss": 0.002502470277249813, "avg_return": 0.4412665367126465, "regret": 0.35832616686820984, "entropy": 0.13558223843574524, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:43.581437Z", "loop": 1619, "env_steps": 995327999, "loss": 0.0025197621434926987, "avg_return": 0.4418867230415344, "regret": 0.35832616686820984, "entropy": 0.13349102437496185, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:44.793666Z", "loop": 1620, "env_steps": 995942399, "loss": 0.002045254921540618, "avg_return": 0.4468645751476288, "regret": 0.36016613245010376, "entropy": 0.1313340663909912, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:45.952102Z", "loop": 1621, "env_steps": 996556799, "loss": 0.0025590138975530863, "avg_return": 0.43603241443634033, "regret": 0.36016613245010376, "entropy": 0.1353081464767456, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:47.112535Z", "loop": 1622, "env_steps": 997171199, "loss": 0.002321538981050253, "avg_return": 0.4458227753639221, "regret": 0.36016613245010376, "entropy": 0.12835516035556793, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:48.271848Z", "loop": 1623, "env_steps": 997785599, "loss": 0.0019969940185546875, "avg_return": 0.4394289255142212, "regret": 0.36016613245010376, "entropy": 0.13461117446422577, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:49.431232Z", "loop": 1624, "env_steps": 998399999, "loss": 0.0023617499973624945, "avg_return": 0.4462994933128357, "regret": 0.36016613245010376, "entropy": 0.13532927632331848, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:50.634044Z", "loop": 1625, "env_steps": 999014399, "loss": 0.002415451453998685, "avg_return": 0.4474148750305176, "regret": 0.35931411385536194, "entropy": 0.13307088613510132, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:51.794244Z", "loop": 1626, "env_steps": 999628799, "loss": 0.0029499807860702276, "avg_return": 0.4465525448322296, "regret": 0.35931411385536194, "entropy": 0.1399764120578766, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:52.954073Z", "loop": 1627, "env_steps": 1000243199, "loss": 0.002965410938486457, "avg_return": 0.4432511627674103, "regret": 0.35931411385536194, "entropy": 0.14036129415035248, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:54.115245Z", "loop": 1628, "env_steps": 1000857599, "loss": 0.0029826073441654444, "avg_return": 0.44995617866516113, "regret": 0.35931411385536194, "entropy": 0.14553207159042358, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:55.274474Z", "loop": 1629, "env_steps": 1001471999, "loss": 0.003065472235903144, "avg_return": 0.45441803336143494, "regret": 0.35931411385536194, "entropy": 0.14222896099090576, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:56.478431Z", "loop": 1630, "env_steps": 1002086399, "loss": 0.0028931773267686367, "avg_return": 0.44580790400505066, "regret": 0.3581876754760742, "entropy": 0.14437848329544067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:57.640064Z", "loop": 1631, "env_steps": 1002700799, "loss": 0.002827811287716031, "avg_return": 0.4475477635860443, "regret": 0.3581876754760742, "entropy": 0.1426318734884262, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:58.800409Z", "loop": 1632, "env_steps": 1003315199, "loss": 0.0028183094691485167, "avg_return": 0.4466017782688141, "regret": 0.3581876754760742, "entropy": 0.14263196289539337, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:57:59.960903Z", "loop": 1633, "env_steps": 1003929599, "loss": 0.0026434988249093294, "avg_return": 0.45017901062965393, "regret": 0.3581876754760742, "entropy": 0.14279502630233765, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:01.122098Z", "loop": 1634, "env_steps": 1004543999, "loss": 0.0027968757785856724, "avg_return": 0.4490916132926941, "regret": 0.3581876754760742, "entropy": 0.15039227902889252, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:02.326814Z", "loop": 1635, "env_steps": 1005158399, "loss": 0.0030169219244271517, "avg_return": 0.4536517560482025, "regret": 0.35757964849472046, "entropy": 0.1459730863571167, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:03.486850Z", "loop": 1636, "env_steps": 1005772799, "loss": 0.003214069176465273, "avg_return": 0.4441404342651367, "regret": 0.35757964849472046, "entropy": 0.15452608466148376, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:04.646131Z", "loop": 1637, "env_steps": 1006387199, "loss": 0.003604662837460637, "avg_return": 0.44596773386001587, "regret": 0.35757964849472046, "entropy": 0.15936368703842163, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:05.806262Z", "loop": 1638, "env_steps": 1007001599, "loss": 0.003479397390037775, "avg_return": 0.4520706236362457, "regret": 0.35757964849472046, "entropy": 0.15925058722496033, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:06.966330Z", "loop": 1639, "env_steps": 1007615999, "loss": 0.0034256496001034975, "avg_return": 0.4518432319164276, "regret": 0.35757964849472046, "entropy": 0.16014227271080017, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:08.170161Z", "loop": 1640, "env_steps": 1008230399, "loss": 0.0037041634786874056, "avg_return": 0.4497871398925781, "regret": 0.35679054260253906, "entropy": 0.17099803686141968, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:09.330661Z", "loop": 1641, "env_steps": 1008844799, "loss": 0.004336247220635414, "avg_return": 0.45442643761634827, "regret": 0.35679054260253906, "entropy": 0.16114594042301178, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:10.491035Z", "loop": 1642, "env_steps": 1009459199, "loss": 0.004203666001558304, "avg_return": 0.44983428716659546, "regret": 0.35679054260253906, "entropy": 0.1655728816986084, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:11.650642Z", "loop": 1643, "env_steps": 1010073599, "loss": 0.0038741964381188154, "avg_return": 0.4417034089565277, "regret": 0.35679054260253906, "entropy": 0.16876105964183807, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:12.810449Z", "loop": 1644, "env_steps": 1010687999, "loss": 0.004028134047985077, "avg_return": 0.45348507165908813, "regret": 0.35679054260253906, "entropy": 0.16553618013858795, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:14.020646Z", "loop": 1645, "env_steps": 1011302399, "loss": 0.003804632229730487, "avg_return": 0.44396814703941345, "regret": 0.35679104924201965, "entropy": 0.16791582107543945, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:15.185362Z", "loop": 1646, "env_steps": 1011916799, "loss": 0.004445727448910475, "avg_return": 0.4512600302696228, "regret": 0.35679104924201965, "entropy": 0.1628035306930542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:16.345130Z", "loop": 1647, "env_steps": 1012531199, "loss": 0.004132797475904226, "avg_return": 0.4464021921157837, "regret": 0.35679104924201965, "entropy": 0.16946549713611603, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:17.505210Z", "loop": 1648, "env_steps": 1013145599, "loss": 0.003534536575898528, "avg_return": 0.45102185010910034, "regret": 0.35679104924201965, "entropy": 0.17063243687152863, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:18.666378Z", "loop": 1649, "env_steps": 1013759999, "loss": 0.0038807683158665895, "avg_return": 0.4446480870246887, "regret": 0.35679104924201965, "entropy": 0.163395956158638, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:19.871775Z", "loop": 1650, "env_steps": 1014374399, "loss": 0.003220687387511134, "avg_return": 0.4436786472797394, "regret": 0.3567921817302704, "entropy": 0.1553068608045578, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:21.034245Z", "loop": 1651, "env_steps": 1014988799, "loss": 0.002590443007647991, "avg_return": 0.44702181220054626, "regret": 0.3567921817302704, "entropy": 0.13748325407505035, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:22.194426Z", "loop": 1652, "env_steps": 1015603199, "loss": 0.002888672286644578, "avg_return": 0.44522857666015625, "regret": 0.3567921817302704, "entropy": 0.14384686946868896, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:23.355290Z", "loop": 1653, "env_steps": 1016217599, "loss": 0.0034577168989926577, "avg_return": 0.44503581523895264, "regret": 0.3567921817302704, "entropy": 0.15686210989952087, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:24.514386Z", "loop": 1654, "env_steps": 1016831999, "loss": 0.0034041290637105703, "avg_return": 0.43748098611831665, "regret": 0.3567921817302704, "entropy": 0.1503141224384308, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:25.721147Z", "loop": 1655, "env_steps": 1017446399, "loss": 0.003335376037284732, "avg_return": 0.4453147351741791, "regret": 0.36194145679473877, "entropy": 0.14560432732105255, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:26.888204Z", "loop": 1656, "env_steps": 1018060799, "loss": 0.0032160754781216383, "avg_return": 0.4381786286830902, "regret": 0.36194145679473877, "entropy": 0.1510135680437088, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:28.048952Z", "loop": 1657, "env_steps": 1018675199, "loss": 0.0033022568095475435, "avg_return": 0.44181016087532043, "regret": 0.36194145679473877, "entropy": 0.1457674354314804, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:29.209985Z", "loop": 1658, "env_steps": 1019289599, "loss": 0.0028345114551484585, "avg_return": 0.44557058811187744, "regret": 0.36194145679473877, "entropy": 0.13659511506557465, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:30.371734Z", "loop": 1659, "env_steps": 1019903999, "loss": 0.0025415215641260147, "avg_return": 0.4470241367816925, "regret": 0.36194145679473877, "entropy": 0.1387042999267578, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:31.577426Z", "loop": 1660, "env_steps": 1020518399, "loss": 0.0024257090408354998, "avg_return": 0.44287317991256714, "regret": 0.35744959115982056, "entropy": 0.14048539102077484, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:32.738161Z", "loop": 1661, "env_steps": 1021132799, "loss": 0.0029366090893745422, "avg_return": 0.45221903920173645, "regret": 0.35744959115982056, "entropy": 0.15064488351345062, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:33.897786Z", "loop": 1662, "env_steps": 1021747199, "loss": 0.0036604616325348616, "avg_return": 0.4541443884372711, "regret": 0.35744959115982056, "entropy": 0.16078534722328186, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:35.059771Z", "loop": 1663, "env_steps": 1022361599, "loss": 0.0034196414053440094, "avg_return": 0.4454698860645294, "regret": 0.35744959115982056, "entropy": 0.17070089280605316, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:36.220513Z", "loop": 1664, "env_steps": 1022975999, "loss": 0.00428728386759758, "avg_return": 0.45226508378982544, "regret": 0.35744959115982056, "entropy": 0.17499594390392303, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:37.426637Z", "loop": 1665, "env_steps": 1023590399, "loss": 0.004711078014224768, "avg_return": 0.4478875696659088, "regret": 0.35627079010009766, "entropy": 0.1710994988679886, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:38.586510Z", "loop": 1666, "env_steps": 1024204799, "loss": 0.004231944214552641, "avg_return": 0.44461676478385925, "regret": 0.35627079010009766, "entropy": 0.16696393489837646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:39.746524Z", "loop": 1667, "env_steps": 1024819199, "loss": 0.0040415492840111256, "avg_return": 0.44598695635795593, "regret": 0.35627079010009766, "entropy": 0.15965856611728668, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:40.906174Z", "loop": 1668, "env_steps": 1025433599, "loss": 0.004330847878009081, "avg_return": 0.4533642828464508, "regret": 0.35627079010009766, "entropy": 0.15886788070201874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:42.065980Z", "loop": 1669, "env_steps": 1026047999, "loss": 0.004621039144694805, "avg_return": 0.455059677362442, "regret": 0.35627079010009766, "entropy": 0.1575012505054474, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:43.270350Z", "loop": 1670, "env_steps": 1026662399, "loss": 0.0046648201532661915, "avg_return": 0.4442436695098877, "regret": 0.3564004898071289, "entropy": 0.15721051394939423, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:44.432144Z", "loop": 1671, "env_steps": 1027276799, "loss": 0.003928651567548513, "avg_return": 0.4478899836540222, "regret": 0.3564004898071289, "entropy": 0.15882600843906403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:45.591241Z", "loop": 1672, "env_steps": 1027891199, "loss": 0.003903232282027602, "avg_return": 0.44839560985565186, "regret": 0.3564004898071289, "entropy": 0.15534141659736633, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:46.750962Z", "loop": 1673, "env_steps": 1028505599, "loss": 0.0041870251297950745, "avg_return": 0.45041993260383606, "regret": 0.3564004898071289, "entropy": 0.16390883922576904, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:47.912196Z", "loop": 1674, "env_steps": 1029119999, "loss": 0.004371559713035822, "avg_return": 0.44551271200180054, "regret": 0.3564004898071289, "entropy": 0.16337910294532776, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:49.116179Z", "loop": 1675, "env_steps": 1029734399, "loss": 0.004283887799829245, "avg_return": 0.4465889036655426, "regret": 0.35640764236450195, "entropy": 0.1565486639738083, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:50.275442Z", "loop": 1676, "env_steps": 1030348799, "loss": 0.003734383499249816, "avg_return": 0.4461294710636139, "regret": 0.35640764236450195, "entropy": 0.15162642300128937, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:51.435465Z", "loop": 1677, "env_steps": 1030963199, "loss": 0.004160746466368437, "avg_return": 0.44842246174812317, "regret": 0.35640764236450195, "entropy": 0.15316042304039001, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:52.594503Z", "loop": 1678, "env_steps": 1031577599, "loss": 0.004729985725134611, "avg_return": 0.44749096035957336, "regret": 0.35640764236450195, "entropy": 0.15536127984523773, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:53.754165Z", "loop": 1679, "env_steps": 1032191999, "loss": 0.004259039647877216, "avg_return": 0.45093822479248047, "regret": 0.35640764236450195, "entropy": 0.15346775949001312, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:54.958447Z", "loop": 1680, "env_steps": 1032806399, "loss": 0.003908826038241386, "avg_return": 0.44293320178985596, "regret": 0.3564797341823578, "entropy": 0.15292222797870636, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:56.119390Z", "loop": 1681, "env_steps": 1033420799, "loss": 0.004465589765459299, "avg_return": 0.4551568329334259, "regret": 0.3564797341823578, "entropy": 0.15567369759082794, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:57.279266Z", "loop": 1682, "env_steps": 1034035199, "loss": 0.004135779570788145, "avg_return": 0.44594046473503113, "regret": 0.3564797341823578, "entropy": 0.14976686239242554, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:58.439456Z", "loop": 1683, "env_steps": 1034649599, "loss": 0.0044838241301476955, "avg_return": 0.4486580491065979, "regret": 0.3564797341823578, "entropy": 0.14581890404224396, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:58:59.600949Z", "loop": 1684, "env_steps": 1035263999, "loss": 0.004455419257283211, "avg_return": 0.44926849007606506, "regret": 0.3564797341823578, "entropy": 0.14409933984279633, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:00.806846Z", "loop": 1685, "env_steps": 1035878399, "loss": 0.00444995891302824, "avg_return": 0.44708508253097534, "regret": 0.3568269908428192, "entropy": 0.151622012257576, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:01.969311Z", "loop": 1686, "env_steps": 1036492799, "loss": 0.005058696493506432, "avg_return": 0.43543529510498047, "regret": 0.3568269908428192, "entropy": 0.15387870371341705, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:03.130007Z", "loop": 1687, "env_steps": 1037107199, "loss": 0.0052276733331382275, "avg_return": 0.44720348715782166, "regret": 0.3568269908428192, "entropy": 0.15644118189811707, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:04.291838Z", "loop": 1688, "env_steps": 1037721599, "loss": 0.004831635393202305, "avg_return": 0.4431983530521393, "regret": 0.3568269908428192, "entropy": 0.14871928095817566, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:05.452622Z", "loop": 1689, "env_steps": 1038335999, "loss": 0.00465810252353549, "avg_return": 0.4289068281650543, "regret": 0.3568269908428192, "entropy": 0.15252694487571716, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:06.658611Z", "loop": 1690, "env_steps": 1038950399, "loss": 0.004835030063986778, "avg_return": 0.4389653503894806, "regret": 0.36388567090034485, "entropy": 0.14649315178394318, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:07.821633Z", "loop": 1691, "env_steps": 1039564799, "loss": 0.00493901502341032, "avg_return": 0.44433411955833435, "regret": 0.36388567090034485, "entropy": 0.14883653819561005, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:08.983170Z", "loop": 1692, "env_steps": 1040179199, "loss": 0.004671093076467514, "avg_return": 0.4420434534549713, "regret": 0.36388567090034485, "entropy": 0.14914065599441528, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:10.143223Z", "loop": 1693, "env_steps": 1040793599, "loss": 0.004718105774372816, "avg_return": 0.44336366653442383, "regret": 0.36388567090034485, "entropy": 0.1567697376012802, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:11.304371Z", "loop": 1694, "env_steps": 1041407999, "loss": 0.00478989677503705, "avg_return": 0.45074179768562317, "regret": 0.36388567090034485, "entropy": 0.1551385223865509, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:12.511472Z", "loop": 1695, "env_steps": 1042022399, "loss": 0.004539910238236189, "avg_return": 0.4503336548805237, "regret": 0.35599103569984436, "entropy": 0.14770598709583282, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:13.672613Z", "loop": 1696, "env_steps": 1042636799, "loss": 0.003944248426705599, "avg_return": 0.44245073199272156, "regret": 0.35599103569984436, "entropy": 0.15879730880260468, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:14.832544Z", "loop": 1697, "env_steps": 1043251199, "loss": 0.003899579169228673, "avg_return": 0.4444657564163208, "regret": 0.35599103569984436, "entropy": 0.16262106597423553, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:15.992450Z", "loop": 1698, "env_steps": 1043865599, "loss": 0.0035768335219472647, "avg_return": 0.4453165829181671, "regret": 0.35599103569984436, "entropy": 0.1600254774093628, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:17.153326Z", "loop": 1699, "env_steps": 1044479999, "loss": 0.003681850153952837, "avg_return": 0.4510480761528015, "regret": 0.35599103569984436, "entropy": 0.14842799305915833, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:18.361385Z", "loop": 1700, "env_steps": 1045094399, "loss": 0.0033882593270391226, "avg_return": 0.4417662024497986, "regret": 0.3561956286430359, "entropy": 0.15951472520828247, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:19.521823Z", "loop": 1701, "env_steps": 1045708799, "loss": 0.0034117475152015686, "avg_return": 0.44408971071243286, "regret": 0.3561956286430359, "entropy": 0.15525653958320618, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:20.681643Z", "loop": 1702, "env_steps": 1046323199, "loss": 0.0030636193696409464, "avg_return": 0.4368011951446533, "regret": 0.3561956286430359, "entropy": 0.14946258068084717, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:21.841428Z", "loop": 1703, "env_steps": 1046937599, "loss": 0.0029184266459196806, "avg_return": 0.4464830160140991, "regret": 0.3561956286430359, "entropy": 0.13973002135753632, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:23.003370Z", "loop": 1704, "env_steps": 1047551999, "loss": 0.0027524286415427923, "avg_return": 0.44640105962753296, "regret": 0.3561956286430359, "entropy": 0.14240428805351257, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:24.209305Z", "loop": 1705, "env_steps": 1048166399, "loss": 0.0026777703315019608, "avg_return": 0.4466868042945862, "regret": 0.3570922911167145, "entropy": 0.14176231622695923, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:25.371243Z", "loop": 1706, "env_steps": 1048780799, "loss": 0.002262688474729657, "avg_return": 0.4509742259979248, "regret": 0.3570922911167145, "entropy": 0.1376299411058426, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:26.530674Z", "loop": 1707, "env_steps": 1049395199, "loss": 0.0024535255506634712, "avg_return": 0.44773367047309875, "regret": 0.3570922911167145, "entropy": 0.13143044710159302, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:27.691172Z", "loop": 1708, "env_steps": 1050009599, "loss": 0.0023483941331505775, "avg_return": 0.45139843225479126, "regret": 0.3570922911167145, "entropy": 0.13103170692920685, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:28.852885Z", "loop": 1709, "env_steps": 1050623999, "loss": 0.0024224515073001385, "avg_return": 0.44932353496551514, "regret": 0.3570922911167145, "entropy": 0.12825828790664673, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:30.055789Z", "loop": 1710, "env_steps": 1051238399, "loss": 0.002183465287089348, "avg_return": 0.4534861445426941, "regret": 0.3578370213508606, "entropy": 0.12819957733154297, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:31.214959Z", "loop": 1711, "env_steps": 1051852799, "loss": 0.0021702039521187544, "avg_return": 0.4517911374568939, "regret": 0.3578370213508606, "entropy": 0.12616202235221863, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:32.375713Z", "loop": 1712, "env_steps": 1052467199, "loss": 0.0022364770993590355, "avg_return": 0.44168564677238464, "regret": 0.3578370213508606, "entropy": 0.13354243338108063, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:33.535930Z", "loop": 1713, "env_steps": 1053081599, "loss": 0.002119036391377449, "avg_return": 0.4467170834541321, "regret": 0.3578370213508606, "entropy": 0.1250712126493454, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:34.695553Z", "loop": 1714, "env_steps": 1053695999, "loss": 0.001948081306181848, "avg_return": 0.4446572959423065, "regret": 0.3578370213508606, "entropy": 0.1325555294752121, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:35.900335Z", "loop": 1715, "env_steps": 1054310399, "loss": 0.0020755366422235966, "avg_return": 0.44259029626846313, "regret": 0.35720571875572205, "entropy": 0.13237254321575165, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:37.062028Z", "loop": 1716, "env_steps": 1054924799, "loss": 0.0023451626766473055, "avg_return": 0.4504978656768799, "regret": 0.35720571875572205, "entropy": 0.13438761234283447, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:38.222640Z", "loop": 1717, "env_steps": 1055539199, "loss": 0.0024057391565293074, "avg_return": 0.44320347905158997, "regret": 0.35720571875572205, "entropy": 0.13884800672531128, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:39.383027Z", "loop": 1718, "env_steps": 1056153599, "loss": 0.0024992201942950487, "avg_return": 0.4452407956123352, "regret": 0.35720571875572205, "entropy": 0.1425447314977646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:40.550344Z", "loop": 1719, "env_steps": 1056767999, "loss": 0.0024811921175569296, "avg_return": 0.4490033686161041, "regret": 0.35720571875572205, "entropy": 0.14648371934890747, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:41.759989Z", "loop": 1720, "env_steps": 1057382399, "loss": 0.002537535736337304, "avg_return": 0.4473517835140228, "regret": 0.35617125034332275, "entropy": 0.14106984436511993, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:42.922422Z", "loop": 1721, "env_steps": 1057996799, "loss": 0.002829218516126275, "avg_return": 0.44921448826789856, "regret": 0.35617125034332275, "entropy": 0.14546768367290497, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:44.086325Z", "loop": 1722, "env_steps": 1058611199, "loss": 0.002484843833371997, "avg_return": 0.44721487164497375, "regret": 0.35617125034332275, "entropy": 0.1460779905319214, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:45.247438Z", "loop": 1723, "env_steps": 1059225599, "loss": 0.002427035244181752, "avg_return": 0.44655758142471313, "regret": 0.35617125034332275, "entropy": 0.1299443393945694, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:46.408098Z", "loop": 1724, "env_steps": 1059839999, "loss": 0.0023018140345811844, "avg_return": 0.4518328011035919, "regret": 0.35617125034332275, "entropy": 0.13525335490703583, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:47.612752Z", "loop": 1725, "env_steps": 1060454399, "loss": 0.0020975989755243063, "avg_return": 0.44746309518814087, "regret": 0.35678234696388245, "entropy": 0.13406988978385925, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:48.776543Z", "loop": 1726, "env_steps": 1061068799, "loss": 0.002333597978577018, "avg_return": 0.4511713683605194, "regret": 0.35678234696388245, "entropy": 0.13418425619602203, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:49.936434Z", "loop": 1727, "env_steps": 1061683199, "loss": 0.002427635481581092, "avg_return": 0.4459269940853119, "regret": 0.35678234696388245, "entropy": 0.14342786371707916, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:51.094759Z", "loop": 1728, "env_steps": 1062297599, "loss": 0.0020794689189642668, "avg_return": 0.44727396965026855, "regret": 0.35678234696388245, "entropy": 0.14404551684856415, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:52.254068Z", "loop": 1729, "env_steps": 1062911999, "loss": 0.0025929741095751524, "avg_return": 0.44622209668159485, "regret": 0.35678234696388245, "entropy": 0.1398092657327652, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:53.461137Z", "loop": 1730, "env_steps": 1063526399, "loss": 0.002479461720213294, "avg_return": 0.44744282960891724, "regret": 0.35577747225761414, "entropy": 0.1348859816789627, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:54.620474Z", "loop": 1731, "env_steps": 1064140799, "loss": 0.00243437965400517, "avg_return": 0.4394962787628174, "regret": 0.35577747225761414, "entropy": 0.1516241431236267, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:55.779619Z", "loop": 1732, "env_steps": 1064755199, "loss": 0.003222814993932843, "avg_return": 0.45116063952445984, "regret": 0.35577747225761414, "entropy": 0.15061651170253754, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:56.939587Z", "loop": 1733, "env_steps": 1065369599, "loss": 0.0029583617579191923, "avg_return": 0.4441685676574707, "regret": 0.35577747225761414, "entropy": 0.1509544402360916, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:58.099885Z", "loop": 1734, "env_steps": 1065983999, "loss": 0.0027201359625905752, "avg_return": 0.4452051818370819, "regret": 0.35577747225761414, "entropy": 0.14901600778102875, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T21:59:59.303316Z", "loop": 1735, "env_steps": 1066598399, "loss": 0.0026690594386309385, "avg_return": 0.44932129979133606, "regret": 0.35518333315849304, "entropy": 0.14690063893795013, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:00.462561Z", "loop": 1736, "env_steps": 1067212799, "loss": 0.002557232743129134, "avg_return": 0.4552079439163208, "regret": 0.35518333315849304, "entropy": 0.14664135873317719, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:01.622094Z", "loop": 1737, "env_steps": 1067827199, "loss": 0.002388762077316642, "avg_return": 0.44627004861831665, "regret": 0.35518333315849304, "entropy": 0.14388832449913025, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:02.781080Z", "loop": 1738, "env_steps": 1068441599, "loss": 0.0024993373081088066, "avg_return": 0.4438663423061371, "regret": 0.35518333315849304, "entropy": 0.1567889302968979, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:03.941157Z", "loop": 1739, "env_steps": 1069055999, "loss": 0.0027049537748098373, "avg_return": 0.45501354336738586, "regret": 0.35518333315849304, "entropy": 0.1487070620059967, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:05.145121Z", "loop": 1740, "env_steps": 1069670399, "loss": 0.003127011004835367, "avg_return": 0.44989776611328125, "regret": 0.3544923961162567, "entropy": 0.15986602008342743, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:06.305205Z", "loop": 1741, "env_steps": 1070284799, "loss": 0.002935894764959812, "avg_return": 0.4466404318809509, "regret": 0.3544923961162567, "entropy": 0.16123069822788239, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:07.464431Z", "loop": 1742, "env_steps": 1070899199, "loss": 0.003717743558809161, "avg_return": 0.4413171410560608, "regret": 0.3544923961162567, "entropy": 0.1698112189769745, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:08.624204Z", "loop": 1743, "env_steps": 1071513599, "loss": 0.0036918085534125566, "avg_return": 0.44677385687828064, "regret": 0.3544923961162567, "entropy": 0.17218369245529175, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:09.785176Z", "loop": 1744, "env_steps": 1072127999, "loss": 0.003816076088696718, "avg_return": 0.44716694951057434, "regret": 0.3544923961162567, "entropy": 0.17487463355064392, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:10.988366Z", "loop": 1745, "env_steps": 1072742399, "loss": 0.003997426480054855, "avg_return": 0.45591890811920166, "regret": 0.35407882928848267, "entropy": 0.17651475965976715, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:12.147054Z", "loop": 1746, "env_steps": 1073356799, "loss": 0.004772154148668051, "avg_return": 0.4515615403652191, "regret": 0.35407882928848267, "entropy": 0.1910945028066635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:13.308125Z", "loop": 1747, "env_steps": 1073971199, "loss": 0.004832754842936993, "avg_return": 0.4494171738624573, "regret": 0.35407882928848267, "entropy": 0.20508551597595215, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:14.468699Z", "loop": 1748, "env_steps": 1074585599, "loss": 0.005652416031807661, "avg_return": 0.44793081283569336, "regret": 0.35407882928848267, "entropy": 0.20919686555862427, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:15.628995Z", "loop": 1749, "env_steps": 1075199999, "loss": 0.005984016228467226, "avg_return": 0.45632457733154297, "regret": 0.35407882928848267, "entropy": 0.22402961552143097, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:16.834344Z", "loop": 1750, "env_steps": 1075814399, "loss": 0.0060937972739338875, "avg_return": 0.44072237610816956, "regret": 0.36442801356315613, "entropy": 0.22841273248195648, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:17.994339Z", "loop": 1751, "env_steps": 1076428799, "loss": 0.006449280772358179, "avg_return": 0.43929144740104675, "regret": 0.36442801356315613, "entropy": 0.22694970667362213, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:19.153891Z", "loop": 1752, "env_steps": 1077043199, "loss": 0.006508579012006521, "avg_return": 0.44578874111175537, "regret": 0.36442801356315613, "entropy": 0.21650318801403046, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:20.313855Z", "loop": 1753, "env_steps": 1077657599, "loss": 0.005685875192284584, "avg_return": 0.4458497166633606, "regret": 0.36442801356315613, "entropy": 0.21559709310531616, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:21.475425Z", "loop": 1754, "env_steps": 1078271999, "loss": 0.0053253453224897385, "avg_return": 0.44601115584373474, "regret": 0.36442801356315613, "entropy": 0.2087617963552475, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:22.679585Z", "loop": 1755, "env_steps": 1078886399, "loss": 0.00459551066160202, "avg_return": 0.45514002442359924, "regret": 0.3543749153614044, "entropy": 0.1874297708272934, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:23.840528Z", "loop": 1756, "env_steps": 1079500799, "loss": 0.0035089736338704824, "avg_return": 0.4422646164894104, "regret": 0.3543749153614044, "entropy": 0.17741785943508148, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:25.001849Z", "loop": 1757, "env_steps": 1080115199, "loss": 0.0032665354665368795, "avg_return": 0.4488923251628876, "regret": 0.3543749153614044, "entropy": 0.15931670367717743, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:26.164904Z", "loop": 1758, "env_steps": 1080729599, "loss": 0.002770138904452324, "avg_return": 0.44549185037612915, "regret": 0.3543749153614044, "entropy": 0.15406854450702667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:27.325087Z", "loop": 1759, "env_steps": 1081343999, "loss": 0.0025023489724844694, "avg_return": 0.44954997301101685, "regret": 0.3543749153614044, "entropy": 0.1504022777080536, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:28.531166Z", "loop": 1760, "env_steps": 1081958399, "loss": 0.0026623595040291548, "avg_return": 0.44311362504959106, "regret": 0.35568782687187195, "entropy": 0.14308224618434906, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:29.691820Z", "loop": 1761, "env_steps": 1082572799, "loss": 0.002503836527466774, "avg_return": 0.44626399874687195, "regret": 0.35568782687187195, "entropy": 0.1492231786251068, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:30.853944Z", "loop": 1762, "env_steps": 1083187199, "loss": 0.0026013250462710857, "avg_return": 0.44679951667785645, "regret": 0.35568782687187195, "entropy": 0.1407448947429657, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:32.015299Z", "loop": 1763, "env_steps": 1083801599, "loss": 0.002684911945834756, "avg_return": 0.4414907395839691, "regret": 0.35568782687187195, "entropy": 0.14732743799686432, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:33.177354Z", "loop": 1764, "env_steps": 1084415999, "loss": 0.0031493648421019316, "avg_return": 0.44859275221824646, "regret": 0.35568782687187195, "entropy": 0.14306065440177917, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:34.381876Z", "loop": 1765, "env_steps": 1085030399, "loss": 0.002955450676381588, "avg_return": 0.449567973613739, "regret": 0.35710951685905457, "entropy": 0.14684639871120453, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:35.543728Z", "loop": 1766, "env_steps": 1085644799, "loss": 0.0028746244497597218, "avg_return": 0.4525120258331299, "regret": 0.35710951685905457, "entropy": 0.14621427655220032, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:36.707756Z", "loop": 1767, "env_steps": 1086259199, "loss": 0.0027432118076831102, "avg_return": 0.44553661346435547, "regret": 0.35710951685905457, "entropy": 0.14041367173194885, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:37.869025Z", "loop": 1768, "env_steps": 1086873599, "loss": 0.0024900934658944607, "avg_return": 0.4491859972476959, "regret": 0.35710951685905457, "entropy": 0.14444755017757416, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:39.028475Z", "loop": 1769, "env_steps": 1087487999, "loss": 0.002756736008450389, "avg_return": 0.45007646083831787, "regret": 0.35710951685905457, "entropy": 0.15600986778736115, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:40.232637Z", "loop": 1770, "env_steps": 1088102399, "loss": 0.004060651641339064, "avg_return": 0.45296406745910645, "regret": 0.353811651468277, "entropy": 0.1716134250164032, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:41.394941Z", "loop": 1771, "env_steps": 1088716799, "loss": 0.004469354171305895, "avg_return": 0.45301327109336853, "regret": 0.353811651468277, "entropy": 0.1772444248199463, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:42.556329Z", "loop": 1772, "env_steps": 1089331199, "loss": 0.004915378522127867, "avg_return": 0.4474569261074066, "regret": 0.353811651468277, "entropy": 0.18114331364631653, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:43.716060Z", "loop": 1773, "env_steps": 1089945599, "loss": 0.005411721300333738, "avg_return": 0.4550292193889618, "regret": 0.353811651468277, "entropy": 0.17866481840610504, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:44.875686Z", "loop": 1774, "env_steps": 1090559999, "loss": 0.004968628287315369, "avg_return": 0.4519334137439728, "regret": 0.353811651468277, "entropy": 0.16835372149944305, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:46.084446Z", "loop": 1775, "env_steps": 1091174399, "loss": 0.004861645866185427, "avg_return": 0.44577476382255554, "regret": 0.35566630959510803, "entropy": 0.16784994304180145, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:47.245181Z", "loop": 1776, "env_steps": 1091788799, "loss": 0.005112893413752317, "avg_return": 0.44762519001960754, "regret": 0.35566630959510803, "entropy": 0.16477070748806, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:48.404606Z", "loop": 1777, "env_steps": 1092403199, "loss": 0.004878687206655741, "avg_return": 0.4568866491317749, "regret": 0.35566630959510803, "entropy": 0.17051741480827332, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:49.565163Z", "loop": 1778, "env_steps": 1093017599, "loss": 0.004597985185682774, "avg_return": 0.4475890100002289, "regret": 0.35566630959510803, "entropy": 0.16730554401874542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:50.726342Z", "loop": 1779, "env_steps": 1093631999, "loss": 0.003618792863562703, "avg_return": 0.4554860591888428, "regret": 0.35566630959510803, "entropy": 0.16778020560741425, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:51.930096Z", "loop": 1780, "env_steps": 1094246399, "loss": 0.0032987501472234726, "avg_return": 0.44982993602752686, "regret": 0.35442355275154114, "entropy": 0.14605768024921417, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:53.088839Z", "loop": 1781, "env_steps": 1094860799, "loss": 0.0024456221144646406, "avg_return": 0.4475332796573639, "regret": 0.35442355275154114, "entropy": 0.13928931951522827, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:54.248709Z", "loop": 1782, "env_steps": 1095475199, "loss": 0.0021258413325995207, "avg_return": 0.4508677124977112, "regret": 0.35442355275154114, "entropy": 0.1312749832868576, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:55.409165Z", "loop": 1783, "env_steps": 1096089599, "loss": 0.0019132463494315743, "avg_return": 0.44537273049354553, "regret": 0.35442355275154114, "entropy": 0.13126201927661896, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:56.569199Z", "loop": 1784, "env_steps": 1096703999, "loss": 0.0018966967472806573, "avg_return": 0.4497659504413605, "regret": 0.35442355275154114, "entropy": 0.1271403729915619, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:57.775160Z", "loop": 1785, "env_steps": 1097318399, "loss": 0.0021435259841382504, "avg_return": 0.44295212626457214, "regret": 0.357817143201828, "entropy": 0.12825962901115417, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:00:58.935825Z", "loop": 1786, "env_steps": 1097932799, "loss": 0.002034879522398114, "avg_return": 0.43746739625930786, "regret": 0.357817143201828, "entropy": 0.13330078125, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:00.094785Z", "loop": 1787, "env_steps": 1098547199, "loss": 0.002819696208462119, "avg_return": 0.4502595067024231, "regret": 0.357817143201828, "entropy": 0.13490810990333557, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:01.254794Z", "loop": 1788, "env_steps": 1099161599, "loss": 0.002255028812214732, "avg_return": 0.4478396773338318, "regret": 0.357817143201828, "entropy": 0.1298172026872635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:02.415831Z", "loop": 1789, "env_steps": 1099775999, "loss": 0.0019479834008961916, "avg_return": 0.440229207277298, "regret": 0.357817143201828, "entropy": 0.13046762347221375, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:03.619473Z", "loop": 1790, "env_steps": 1100390399, "loss": 0.002055998658761382, "avg_return": 0.45404115319252014, "regret": 0.3570411801338196, "entropy": 0.12572288513183594, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:04.778766Z", "loop": 1791, "env_steps": 1101004799, "loss": 0.0019436670700088143, "avg_return": 0.4449314475059509, "regret": 0.3570411801338196, "entropy": 0.1318492740392685, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:05.938486Z", "loop": 1792, "env_steps": 1101619199, "loss": 0.0022115414030849934, "avg_return": 0.44714677333831787, "regret": 0.3570411801338196, "entropy": 0.12344562262296677, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:07.097563Z", "loop": 1793, "env_steps": 1102233599, "loss": 0.0019622293766587973, "avg_return": 0.4468354284763336, "regret": 0.3570411801338196, "entropy": 0.12591126561164856, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:08.260251Z", "loop": 1794, "env_steps": 1102847999, "loss": 0.0021656255703419447, "avg_return": 0.45546218752861023, "regret": 0.3570411801338196, "entropy": 0.133201003074646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:09.464696Z", "loop": 1795, "env_steps": 1103462399, "loss": 0.0021291887387633324, "avg_return": 0.44524431228637695, "regret": 0.35479459166526794, "entropy": 0.14266914129257202, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:10.627752Z", "loop": 1796, "env_steps": 1104076799, "loss": 0.0024486433248966932, "avg_return": 0.44776028394699097, "regret": 0.35479459166526794, "entropy": 0.1415836066007614, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:11.788317Z", "loop": 1797, "env_steps": 1104691199, "loss": 0.0020167971961200237, "avg_return": 0.45201006531715393, "regret": 0.35479459166526794, "entropy": 0.13160282373428345, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:12.949364Z", "loop": 1798, "env_steps": 1105305599, "loss": 0.0020924084819853306, "avg_return": 0.44920432567596436, "regret": 0.35479459166526794, "entropy": 0.13795265555381775, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:14.111564Z", "loop": 1799, "env_steps": 1105919999, "loss": 0.0021210950799286366, "avg_return": 0.4591972827911377, "regret": 0.35479459166526794, "entropy": 0.13193073868751526, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:15.318538Z", "loop": 1800, "env_steps": 1106534399, "loss": 0.002276771003380418, "avg_return": 0.45036739110946655, "regret": 0.3548096716403961, "entropy": 0.132371187210083, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:16.479997Z", "loop": 1801, "env_steps": 1107148799, "loss": 0.002063282998278737, "avg_return": 0.45288896560668945, "regret": 0.3548096716403961, "entropy": 0.134010449051857, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:17.640012Z", "loop": 1802, "env_steps": 1107763199, "loss": 0.0020137180108577013, "avg_return": 0.4495331943035126, "regret": 0.3548096716403961, "entropy": 0.13852572441101074, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:18.801775Z", "loop": 1803, "env_steps": 1108377599, "loss": 0.0024283118546009064, "avg_return": 0.4529202878475189, "regret": 0.3548096716403961, "entropy": 0.1397850066423416, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:19.962781Z", "loop": 1804, "env_steps": 1108991999, "loss": 0.002458496717736125, "avg_return": 0.4515021741390228, "regret": 0.3548096716403961, "entropy": 0.14020173251628876, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:21.167711Z", "loop": 1805, "env_steps": 1109606399, "loss": 0.0029316472355276346, "avg_return": 0.4525109827518463, "regret": 0.35365352034568787, "entropy": 0.1540014147758484, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:22.328278Z", "loop": 1806, "env_steps": 1110220799, "loss": 0.0029486864805221558, "avg_return": 0.4438134729862213, "regret": 0.35365352034568787, "entropy": 0.15726807713508606, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:23.488085Z", "loop": 1807, "env_steps": 1110835199, "loss": 0.0035495366901159286, "avg_return": 0.4542643427848816, "regret": 0.35365352034568787, "entropy": 0.15954400599002838, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:24.647193Z", "loop": 1808, "env_steps": 1111449599, "loss": 0.004138224758207798, "avg_return": 0.450792133808136, "regret": 0.35365352034568787, "entropy": 0.17100554704666138, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:25.806980Z", "loop": 1809, "env_steps": 1112063999, "loss": 0.005039670038968325, "avg_return": 0.4462522566318512, "regret": 0.35365352034568787, "entropy": 0.17406503856182098, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:27.009175Z", "loop": 1810, "env_steps": 1112678399, "loss": 0.0050273253582417965, "avg_return": 0.4463525414466858, "regret": 0.35516270995140076, "entropy": 0.16515007615089417, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:28.169757Z", "loop": 1811, "env_steps": 1113292799, "loss": 0.0053300876170396805, "avg_return": 0.45822104811668396, "regret": 0.35516270995140076, "entropy": 0.16289250552654266, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:29.330308Z", "loop": 1812, "env_steps": 1113907199, "loss": 0.0056219459511339664, "avg_return": 0.4478031396865845, "regret": 0.35516270995140076, "entropy": 0.16686752438545227, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:30.491368Z", "loop": 1813, "env_steps": 1114521599, "loss": 0.00508006289601326, "avg_return": 0.4511186182498932, "regret": 0.35516270995140076, "entropy": 0.15846456587314606, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:31.651963Z", "loop": 1814, "env_steps": 1115135999, "loss": 0.004703494254499674, "avg_return": 0.45181742310523987, "regret": 0.35516270995140076, "entropy": 0.16036193072795868, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:32.857480Z", "loop": 1815, "env_steps": 1115750399, "loss": 0.004708377178758383, "avg_return": 0.4590306580066681, "regret": 0.3534066081047058, "entropy": 0.15956880152225494, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:34.017802Z", "loop": 1816, "env_steps": 1116364799, "loss": 0.004528821911662817, "avg_return": 0.4495096802711487, "regret": 0.3534066081047058, "entropy": 0.15350441634655, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:35.182442Z", "loop": 1817, "env_steps": 1116979199, "loss": 0.004257857333868742, "avg_return": 0.4521598517894745, "regret": 0.3534066081047058, "entropy": 0.15120825171470642, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:36.341260Z", "loop": 1818, "env_steps": 1117593599, "loss": 0.004418648313730955, "avg_return": 0.4565511643886566, "regret": 0.3534066081047058, "entropy": 0.150043323636055, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:37.500905Z", "loop": 1819, "env_steps": 1118207999, "loss": 0.004646446090191603, "avg_return": 0.44835156202316284, "regret": 0.3534066081047058, "entropy": 0.15393342077732086, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:38.707441Z", "loop": 1820, "env_steps": 1118822399, "loss": 0.004229940474033356, "avg_return": 0.45561712980270386, "regret": 0.3535040020942688, "entropy": 0.14640052616596222, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:39.868047Z", "loop": 1821, "env_steps": 1119436799, "loss": 0.0034856244456022978, "avg_return": 0.4490940570831299, "regret": 0.3535040020942688, "entropy": 0.1487240493297577, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:41.028032Z", "loop": 1822, "env_steps": 1120051199, "loss": 0.003389158518984914, "avg_return": 0.44672197103500366, "regret": 0.3535040020942688, "entropy": 0.1522447019815445, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:42.188307Z", "loop": 1823, "env_steps": 1120665599, "loss": 0.003458482911810279, "avg_return": 0.4497887194156647, "regret": 0.3535040020942688, "entropy": 0.14790433645248413, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:43.349794Z", "loop": 1824, "env_steps": 1121279999, "loss": 0.00306393182836473, "avg_return": 0.45218583941459656, "regret": 0.3535040020942688, "entropy": 0.14874885976314545, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:44.553474Z", "loop": 1825, "env_steps": 1121894399, "loss": 0.0032035328913480043, "avg_return": 0.45178818702697754, "regret": 0.3540852963924408, "entropy": 0.1400986611843109, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:45.712775Z", "loop": 1826, "env_steps": 1122508799, "loss": 0.0038306687492877245, "avg_return": 0.453048974275589, "regret": 0.3540852963924408, "entropy": 0.1524926871061325, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:46.872448Z", "loop": 1827, "env_steps": 1123123199, "loss": 0.004053565673530102, "avg_return": 0.44887298345565796, "regret": 0.3540852963924408, "entropy": 0.14477241039276123, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:48.032914Z", "loop": 1828, "env_steps": 1123737599, "loss": 0.0035140176769346, "avg_return": 0.45167481899261475, "regret": 0.3540852963924408, "entropy": 0.15118743479251862, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:49.192245Z", "loop": 1829, "env_steps": 1124351999, "loss": 0.004188199993222952, "avg_return": 0.4420023262500763, "regret": 0.3540852963924408, "entropy": 0.1491633653640747, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:50.394549Z", "loop": 1830, "env_steps": 1124966399, "loss": 0.0040720985271036625, "avg_return": 0.4460195004940033, "regret": 0.3535746932029724, "entropy": 0.14508265256881714, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:51.556461Z", "loop": 1831, "env_steps": 1125580799, "loss": 0.004348214715719223, "avg_return": 0.4516938328742981, "regret": 0.3535746932029724, "entropy": 0.15209679305553436, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:52.715278Z", "loop": 1832, "env_steps": 1126195199, "loss": 0.004366170149296522, "avg_return": 0.45372799038887024, "regret": 0.3535746932029724, "entropy": 0.1416427195072174, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:53.874768Z", "loop": 1833, "env_steps": 1126809599, "loss": 0.004443977493792772, "avg_return": 0.4488988220691681, "regret": 0.3535746932029724, "entropy": 0.144269198179245, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:55.035918Z", "loop": 1834, "env_steps": 1127423999, "loss": 0.004508198704570532, "avg_return": 0.4502910077571869, "regret": 0.3535746932029724, "entropy": 0.15169820189476013, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:56.242811Z", "loop": 1835, "env_steps": 1128038399, "loss": 0.004230915103107691, "avg_return": 0.45058584213256836, "regret": 0.3533335030078888, "entropy": 0.1457386165857315, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:57.404271Z", "loop": 1836, "env_steps": 1128652799, "loss": 0.004032631404697895, "avg_return": 0.45703187584877014, "regret": 0.3533335030078888, "entropy": 0.1479637324810028, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:58.564042Z", "loop": 1837, "env_steps": 1129267199, "loss": 0.004777051042765379, "avg_return": 0.45095476508140564, "regret": 0.3533335030078888, "entropy": 0.14905768632888794, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:01:59.726191Z", "loop": 1838, "env_steps": 1129881599, "loss": 0.003992847166955471, "avg_return": 0.44816142320632935, "regret": 0.3533335030078888, "entropy": 0.14949744939804077, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:00.887501Z", "loop": 1839, "env_steps": 1130495999, "loss": 0.003920439630746841, "avg_return": 0.44529756903648376, "regret": 0.3533335030078888, "entropy": 0.1434621661901474, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:02.095986Z", "loop": 1840, "env_steps": 1131110399, "loss": 0.003994825761765242, "avg_return": 0.45238032937049866, "regret": 0.3533470034599304, "entropy": 0.14918671548366547, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:03.256072Z", "loop": 1841, "env_steps": 1131724799, "loss": 0.0037954989820718765, "avg_return": 0.44999635219573975, "regret": 0.3533470034599304, "entropy": 0.1508917212486267, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:04.417340Z", "loop": 1842, "env_steps": 1132339199, "loss": 0.003683189395815134, "avg_return": 0.45188766717910767, "regret": 0.3533470034599304, "entropy": 0.1538117527961731, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:05.577592Z", "loop": 1843, "env_steps": 1132953599, "loss": 0.0036166019272059202, "avg_return": 0.4476015269756317, "regret": 0.3533470034599304, "entropy": 0.14828234910964966, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:06.737640Z", "loop": 1844, "env_steps": 1133567999, "loss": 0.0028225246351212263, "avg_return": 0.45246970653533936, "regret": 0.3533470034599304, "entropy": 0.14267593622207642, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:07.940922Z", "loop": 1845, "env_steps": 1134182399, "loss": 0.002523569855839014, "avg_return": 0.4484042525291443, "regret": 0.3542018234729767, "entropy": 0.14431197941303253, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:09.101370Z", "loop": 1846, "env_steps": 1134796799, "loss": 0.002477142261341214, "avg_return": 0.4519813656806946, "regret": 0.3542018234729767, "entropy": 0.14362205564975739, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:10.260481Z", "loop": 1847, "env_steps": 1135411199, "loss": 0.0024874797090888023, "avg_return": 0.45234957337379456, "regret": 0.3542018234729767, "entropy": 0.13436707854270935, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:11.420330Z", "loop": 1848, "env_steps": 1136025599, "loss": 0.002010604366660118, "avg_return": 0.45245322585105896, "regret": 0.3542018234729767, "entropy": 0.1443612426519394, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:12.579552Z", "loop": 1849, "env_steps": 1136639999, "loss": 0.0022715418599545956, "avg_return": 0.4597594738006592, "regret": 0.3542018234729767, "entropy": 0.143579363822937, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:13.782404Z", "loop": 1850, "env_steps": 1137254399, "loss": 0.0024846226442605257, "avg_return": 0.44716677069664, "regret": 0.35432732105255127, "entropy": 0.14627502858638763, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:14.943403Z", "loop": 1851, "env_steps": 1137868799, "loss": 0.002552090911194682, "avg_return": 0.44507142901420593, "regret": 0.35432732105255127, "entropy": 0.14233475923538208, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:16.104095Z", "loop": 1852, "env_steps": 1138483199, "loss": 0.0029769630637019873, "avg_return": 0.45558738708496094, "regret": 0.35432732105255127, "entropy": 0.13890890777111053, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:17.263911Z", "loop": 1853, "env_steps": 1139097599, "loss": 0.0030773142352700233, "avg_return": 0.4534074366092682, "regret": 0.35432732105255127, "entropy": 0.1425192952156067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:18.423407Z", "loop": 1854, "env_steps": 1139711999, "loss": 0.003674244275316596, "avg_return": 0.45143261551856995, "regret": 0.35432732105255127, "entropy": 0.15139935910701752, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:19.626637Z", "loop": 1855, "env_steps": 1140326399, "loss": 0.0037424557376652956, "avg_return": 0.4512064754962921, "regret": 0.3529735505580902, "entropy": 0.1447046399116516, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:20.789234Z", "loop": 1856, "env_steps": 1140940799, "loss": 0.003944204654544592, "avg_return": 0.4488288462162018, "regret": 0.3529735505580902, "entropy": 0.15203545987606049, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:21.949116Z", "loop": 1857, "env_steps": 1141555199, "loss": 0.004498337395489216, "avg_return": 0.4562138020992279, "regret": 0.3529735505580902, "entropy": 0.14750991761684418, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:23.111940Z", "loop": 1858, "env_steps": 1142169599, "loss": 0.004758915398269892, "avg_return": 0.4449191987514496, "regret": 0.3529735505580902, "entropy": 0.14452341198921204, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:24.271756Z", "loop": 1859, "env_steps": 1142783999, "loss": 0.005265010986477137, "avg_return": 0.4457743465900421, "regret": 0.3529735505580902, "entropy": 0.1516348272562027, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:25.477180Z", "loop": 1860, "env_steps": 1143398399, "loss": 0.005255196243524551, "avg_return": 0.44797807931900024, "regret": 0.3537156283855438, "entropy": 0.15506401658058167, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:26.637960Z", "loop": 1861, "env_steps": 1144012799, "loss": 0.004759902600198984, "avg_return": 0.44510194659233093, "regret": 0.3537156283855438, "entropy": 0.14768750965595245, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:27.798334Z", "loop": 1862, "env_steps": 1144627199, "loss": 0.005151835270226002, "avg_return": 0.45180827379226685, "regret": 0.3537156283855438, "entropy": 0.15217576920986176, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:28.957723Z", "loop": 1863, "env_steps": 1145241599, "loss": 0.004733639303594828, "avg_return": 0.4490870237350464, "regret": 0.3537156283855438, "entropy": 0.14590559899806976, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:30.117718Z", "loop": 1864, "env_steps": 1145855999, "loss": 0.004708378110080957, "avg_return": 0.44957178831100464, "regret": 0.3537156283855438, "entropy": 0.1567375361919403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:31.320343Z", "loop": 1865, "env_steps": 1146470399, "loss": 0.0051810587756335735, "avg_return": 0.44701945781707764, "regret": 0.35260340571403503, "entropy": 0.14907613396644592, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:32.486311Z", "loop": 1866, "env_steps": 1147084799, "loss": 0.004821514245122671, "avg_return": 0.45697611570358276, "regret": 0.35260340571403503, "entropy": 0.14818735420703888, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:33.647052Z", "loop": 1867, "env_steps": 1147699199, "loss": 0.004125702194869518, "avg_return": 0.4543219208717346, "regret": 0.35260340571403503, "entropy": 0.15595345199108124, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:34.807179Z", "loop": 1868, "env_steps": 1148313599, "loss": 0.003792982315644622, "avg_return": 0.4529670178890228, "regret": 0.35260340571403503, "entropy": 0.15536589920520782, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:35.966402Z", "loop": 1869, "env_steps": 1148927999, "loss": 0.0034032200928777456, "avg_return": 0.45393016934394836, "regret": 0.35260340571403503, "entropy": 0.15436948835849762, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:37.174063Z", "loop": 1870, "env_steps": 1149542399, "loss": 0.0031861532479524612, "avg_return": 0.44830963015556335, "regret": 0.352601021528244, "entropy": 0.1538352072238922, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:38.333680Z", "loop": 1871, "env_steps": 1150156799, "loss": 0.0027474313974380493, "avg_return": 0.4510025680065155, "regret": 0.352601021528244, "entropy": 0.1529262363910675, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:39.493645Z", "loop": 1872, "env_steps": 1150771199, "loss": 0.002782047726213932, "avg_return": 0.45276886224746704, "regret": 0.352601021528244, "entropy": 0.1420343965291977, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:40.653130Z", "loop": 1873, "env_steps": 1151385599, "loss": 0.0025598835200071335, "avg_return": 0.4459349811077118, "regret": 0.352601021528244, "entropy": 0.14773765206336975, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:41.812451Z", "loop": 1874, "env_steps": 1151999999, "loss": 0.002613853896036744, "avg_return": 0.44778960943222046, "regret": 0.352601021528244, "entropy": 0.15106193721294403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:43.016260Z", "loop": 1875, "env_steps": 1152614399, "loss": 0.0027696758043020964, "avg_return": 0.4456689655780792, "regret": 0.3523522913455963, "entropy": 0.14593487977981567, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:44.176252Z", "loop": 1876, "env_steps": 1153228799, "loss": 0.003073005937039852, "avg_return": 0.45955345034599304, "regret": 0.3523522913455963, "entropy": 0.15524473786354065, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:45.335402Z", "loop": 1877, "env_steps": 1153843199, "loss": 0.003280425211414695, "avg_return": 0.4482311010360718, "regret": 0.3523522913455963, "entropy": 0.15024207532405853, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:46.495128Z", "loop": 1878, "env_steps": 1154457599, "loss": 0.00379193015396595, "avg_return": 0.4516693651676178, "regret": 0.3523522913455963, "entropy": 0.15345676243305206, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:47.655862Z", "loop": 1879, "env_steps": 1155071999, "loss": 0.00358596327714622, "avg_return": 0.4535965025424957, "regret": 0.3523522913455963, "entropy": 0.15626460313796997, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:48.859412Z", "loop": 1880, "env_steps": 1155686399, "loss": 0.004102808423340321, "avg_return": 0.4434987008571625, "regret": 0.35218578577041626, "entropy": 0.1693723499774933, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:50.019325Z", "loop": 1881, "env_steps": 1156300799, "loss": 0.004351260606199503, "avg_return": 0.4486037790775299, "regret": 0.35218578577041626, "entropy": 0.1658625304698944, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:51.179735Z", "loop": 1882, "env_steps": 1156915199, "loss": 0.005137123633176088, "avg_return": 0.45070725679397583, "regret": 0.35218578577041626, "entropy": 0.1712997555732727, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:52.339345Z", "loop": 1883, "env_steps": 1157529599, "loss": 0.0048782662488520145, "avg_return": 0.4463392198085785, "regret": 0.35218578577041626, "entropy": 0.17253847420215607, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:53.498870Z", "loop": 1884, "env_steps": 1158143999, "loss": 0.005582447163760662, "avg_return": 0.4570140242576599, "regret": 0.35218578577041626, "entropy": 0.17289598286151886, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:54.703308Z", "loop": 1885, "env_steps": 1158758399, "loss": 0.00521994661539793, "avg_return": 0.4543529450893402, "regret": 0.353478342294693, "entropy": 0.16917505860328674, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:55.863923Z", "loop": 1886, "env_steps": 1159372799, "loss": 0.00517842173576355, "avg_return": 0.4590775668621063, "regret": 0.353478342294693, "entropy": 0.1632111668586731, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:57.023903Z", "loop": 1887, "env_steps": 1159987199, "loss": 0.004333298187702894, "avg_return": 0.4530503451824188, "regret": 0.353478342294693, "entropy": 0.17446233332157135, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:58.185139Z", "loop": 1888, "env_steps": 1160601599, "loss": 0.0047619580291211605, "avg_return": 0.4534328281879425, "regret": 0.353478342294693, "entropy": 0.16275589168071747, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:02:59.346814Z", "loop": 1889, "env_steps": 1161215999, "loss": 0.004575060680508614, "avg_return": 0.4534603953361511, "regret": 0.353478342294693, "entropy": 0.1625996083021164, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:00.551121Z", "loop": 1890, "env_steps": 1161830399, "loss": 0.005316910799592733, "avg_return": 0.4483567476272583, "regret": 0.3529953062534332, "entropy": 0.16827167570590973, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:01.710705Z", "loop": 1891, "env_steps": 1162444799, "loss": 0.004897099919617176, "avg_return": 0.44892334938049316, "regret": 0.3529953062534332, "entropy": 0.16832812130451202, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:02.872032Z", "loop": 1892, "env_steps": 1163059199, "loss": 0.0049905977211892605, "avg_return": 0.44201138615608215, "regret": 0.3529953062534332, "entropy": 0.1725185364484787, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:04.034496Z", "loop": 1893, "env_steps": 1163673599, "loss": 0.004758933093398809, "avg_return": 0.45115241408348083, "regret": 0.3529953062534332, "entropy": 0.163503497838974, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:05.194738Z", "loop": 1894, "env_steps": 1164287999, "loss": 0.004642115440219641, "avg_return": 0.4469982981681824, "regret": 0.3529953062534332, "entropy": 0.16606596112251282, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:06.414228Z", "loop": 1895, "env_steps": 1164902399, "loss": 0.004362098407000303, "avg_return": 0.4485238790512085, "regret": 0.3524857759475708, "entropy": 0.16368596255779266, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:07.576343Z", "loop": 1896, "env_steps": 1165516799, "loss": 0.004762762691825628, "avg_return": 0.4556688666343689, "regret": 0.3524857759475708, "entropy": 0.15938536822795868, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:08.737058Z", "loop": 1897, "env_steps": 1166131199, "loss": 0.004800925496965647, "avg_return": 0.45333969593048096, "regret": 0.3524857759475708, "entropy": 0.15522125363349915, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:09.896138Z", "loop": 1898, "env_steps": 1166745599, "loss": 0.0042323279194533825, "avg_return": 0.45433562994003296, "regret": 0.3524857759475708, "entropy": 0.15779496729373932, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:11.056631Z", "loop": 1899, "env_steps": 1167359999, "loss": 0.0037861305754631758, "avg_return": 0.4468706250190735, "regret": 0.3524857759475708, "entropy": 0.15446993708610535, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:12.261520Z", "loop": 1900, "env_steps": 1167974399, "loss": 0.003697127802297473, "avg_return": 0.44959336519241333, "regret": 0.3519623577594757, "entropy": 0.15567117929458618, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:13.423230Z", "loop": 1901, "env_steps": 1168588799, "loss": 0.003573716850951314, "avg_return": 0.45370718836784363, "regret": 0.3519623577594757, "entropy": 0.15205447375774384, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:14.583561Z", "loop": 1902, "env_steps": 1169203199, "loss": 0.0032186799217015505, "avg_return": 0.452261358499527, "regret": 0.3519623577594757, "entropy": 0.15182912349700928, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:15.743716Z", "loop": 1903, "env_steps": 1169817599, "loss": 0.0029610737692564726, "avg_return": 0.4554833471775055, "regret": 0.3519623577594757, "entropy": 0.14676815271377563, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:16.904270Z", "loop": 1904, "env_steps": 1170431999, "loss": 0.002820698544383049, "avg_return": 0.45762911438941956, "regret": 0.3519623577594757, "entropy": 0.14113521575927734, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:18.109362Z", "loop": 1905, "env_steps": 1171046399, "loss": 0.0025178506039083004, "avg_return": 0.45577359199523926, "regret": 0.35258200764656067, "entropy": 0.1352778524160385, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:19.269239Z", "loop": 1906, "env_steps": 1171660799, "loss": 0.002043974818661809, "avg_return": 0.4507680833339691, "regret": 0.35258200764656067, "entropy": 0.1273471713066101, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:20.428787Z", "loop": 1907, "env_steps": 1172275199, "loss": 0.0019569776486605406, "avg_return": 0.4465788006782532, "regret": 0.35258200764656067, "entropy": 0.12622126936912537, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:21.587766Z", "loop": 1908, "env_steps": 1172889599, "loss": 0.0020407529082149267, "avg_return": 0.45604538917541504, "regret": 0.35258200764656067, "entropy": 0.1253422051668167, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:22.747463Z", "loop": 1909, "env_steps": 1173503999, "loss": 0.002119525335729122, "avg_return": 0.45143628120422363, "regret": 0.35258200764656067, "entropy": 0.1331070363521576, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:23.953130Z", "loop": 1910, "env_steps": 1174118399, "loss": 0.0019709395710378885, "avg_return": 0.4411749839782715, "regret": 0.353129118680954, "entropy": 0.13364487886428833, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:25.113859Z", "loop": 1911, "env_steps": 1174732799, "loss": 0.002112335292622447, "avg_return": 0.45226991176605225, "regret": 0.353129118680954, "entropy": 0.13351666927337646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:26.273678Z", "loop": 1912, "env_steps": 1175347199, "loss": 0.0023128704633563757, "avg_return": 0.447739839553833, "regret": 0.353129118680954, "entropy": 0.13067302107810974, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:27.434294Z", "loop": 1913, "env_steps": 1175961599, "loss": 0.002424471313133836, "avg_return": 0.448944091796875, "regret": 0.353129118680954, "entropy": 0.1319151371717453, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:28.595958Z", "loop": 1914, "env_steps": 1176575999, "loss": 0.002305296016857028, "avg_return": 0.4514896869659424, "regret": 0.353129118680954, "entropy": 0.13510176539421082, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:29.800596Z", "loop": 1915, "env_steps": 1177190399, "loss": 0.0024180649779736996, "avg_return": 0.45190665125846863, "regret": 0.35234737396240234, "entropy": 0.13873586058616638, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:30.966976Z", "loop": 1916, "env_steps": 1177804799, "loss": 0.002545593772083521, "avg_return": 0.4549442529678345, "regret": 0.35234737396240234, "entropy": 0.142501100897789, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:32.126945Z", "loop": 1917, "env_steps": 1178419199, "loss": 0.00301527651026845, "avg_return": 0.4491177499294281, "regret": 0.35234737396240234, "entropy": 0.14698751270771027, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:33.288371Z", "loop": 1918, "env_steps": 1179033599, "loss": 0.003775503486394882, "avg_return": 0.44599688053131104, "regret": 0.35234737396240234, "entropy": 0.16498245298862457, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:34.448114Z", "loop": 1919, "env_steps": 1179647999, "loss": 0.0043700444512069225, "avg_return": 0.45346564054489136, "regret": 0.35234737396240234, "entropy": 0.17778830230236053, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:35.653509Z", "loop": 1920, "env_steps": 1180262399, "loss": 0.005067150574177504, "avg_return": 0.4503819942474365, "regret": 0.3555826246738434, "entropy": 0.17494647204875946, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:36.814717Z", "loop": 1921, "env_steps": 1180876799, "loss": 0.005368131212890148, "avg_return": 0.44308626651763916, "regret": 0.3555826246738434, "entropy": 0.18297767639160156, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:37.975638Z", "loop": 1922, "env_steps": 1181491199, "loss": 0.005082054529339075, "avg_return": 0.4372338056564331, "regret": 0.3555826246738434, "entropy": 0.1719583421945572, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:39.135172Z", "loop": 1923, "env_steps": 1182105599, "loss": 0.005000665318220854, "avg_return": 0.43856945633888245, "regret": 0.3555826246738434, "entropy": 0.1657421588897705, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:40.295223Z", "loop": 1924, "env_steps": 1182719999, "loss": 0.0053116981871426105, "avg_return": 0.4405289888381958, "regret": 0.3555826246738434, "entropy": 0.17237789928913116, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:41.500314Z", "loop": 1925, "env_steps": 1183334399, "loss": 0.005180157721042633, "avg_return": 0.4557377099990845, "regret": 0.3552212119102478, "entropy": 0.15777595341205597, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:42.661213Z", "loop": 1926, "env_steps": 1183948799, "loss": 0.005423048976808786, "avg_return": 0.44825685024261475, "regret": 0.3552212119102478, "entropy": 0.1615433394908905, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:43.820959Z", "loop": 1927, "env_steps": 1184563199, "loss": 0.004318885039538145, "avg_return": 0.45550069212913513, "regret": 0.3552212119102478, "entropy": 0.14881010353565216, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:44.982044Z", "loop": 1928, "env_steps": 1185177599, "loss": 0.004362579435110092, "avg_return": 0.448906272649765, "regret": 0.3552212119102478, "entropy": 0.1478962004184723, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:46.141834Z", "loop": 1929, "env_steps": 1185791999, "loss": 0.004404299892485142, "avg_return": 0.45638713240623474, "regret": 0.3552212119102478, "entropy": 0.14118912816047668, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:47.353276Z", "loop": 1930, "env_steps": 1186406399, "loss": 0.0037041602190583944, "avg_return": 0.45145946741104126, "regret": 0.35213443636894226, "entropy": 0.1374063342809677, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:48.512860Z", "loop": 1931, "env_steps": 1187020799, "loss": 0.0042205615900456905, "avg_return": 0.44902294874191284, "regret": 0.35213443636894226, "entropy": 0.13246947526931763, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:49.672808Z", "loop": 1932, "env_steps": 1187635199, "loss": 0.004013991914689541, "avg_return": 0.45721274614334106, "regret": 0.35213443636894226, "entropy": 0.1347561627626419, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:50.832188Z", "loop": 1933, "env_steps": 1188249599, "loss": 0.004628212656825781, "avg_return": 0.45551636815071106, "regret": 0.35213443636894226, "entropy": 0.13930566608905792, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:51.992185Z", "loop": 1934, "env_steps": 1188863999, "loss": 0.00417910935357213, "avg_return": 0.45577484369277954, "regret": 0.35213443636894226, "entropy": 0.1317928284406662, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:53.197300Z", "loop": 1935, "env_steps": 1189478399, "loss": 0.004000748973339796, "avg_return": 0.4458949863910675, "regret": 0.3525969386100769, "entropy": 0.13038992881774902, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:54.357743Z", "loop": 1936, "env_steps": 1190092799, "loss": 0.004345896188169718, "avg_return": 0.448148250579834, "regret": 0.3525969386100769, "entropy": 0.13031525909900665, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:55.517027Z", "loop": 1937, "env_steps": 1190707199, "loss": 0.004246801137924194, "avg_return": 0.4514003098011017, "regret": 0.3525969386100769, "entropy": 0.1300857663154602, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:56.677366Z", "loop": 1938, "env_steps": 1191321599, "loss": 0.004738945048302412, "avg_return": 0.45127370953559875, "regret": 0.3525969386100769, "entropy": 0.13277724385261536, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:57.836303Z", "loop": 1939, "env_steps": 1191935999, "loss": 0.004362024366855621, "avg_return": 0.4562700390815735, "regret": 0.3525969386100769, "entropy": 0.12937624752521515, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:03:59.039938Z", "loop": 1940, "env_steps": 1192550399, "loss": 0.00413852371275425, "avg_return": 0.4453465938568115, "regret": 0.3525067865848541, "entropy": 0.1350293904542923, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:00.200331Z", "loop": 1941, "env_steps": 1193164799, "loss": 0.004018325824290514, "avg_return": 0.46134400367736816, "regret": 0.3525067865848541, "entropy": 0.13868814706802368, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:01.361998Z", "loop": 1942, "env_steps": 1193779199, "loss": 0.003921155352145433, "avg_return": 0.4536101520061493, "regret": 0.3525067865848541, "entropy": 0.13499124348163605, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:02.521566Z", "loop": 1943, "env_steps": 1194393599, "loss": 0.003273244947195053, "avg_return": 0.44785502552986145, "regret": 0.3525067865848541, "entropy": 0.14492541551589966, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:03.681850Z", "loop": 1944, "env_steps": 1195007999, "loss": 0.003532238770276308, "avg_return": 0.457920640707016, "regret": 0.3525067865848541, "entropy": 0.1498042494058609, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:04.886441Z", "loop": 1945, "env_steps": 1195622399, "loss": 0.0032414444722235203, "avg_return": 0.4491669237613678, "regret": 0.35343489050865173, "entropy": 0.14502425491809845, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:06.047755Z", "loop": 1946, "env_steps": 1196236799, "loss": 0.0025713439099490643, "avg_return": 0.44667670130729675, "regret": 0.35343489050865173, "entropy": 0.14124621450901031, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:07.207193Z", "loop": 1947, "env_steps": 1196851199, "loss": 0.0025039303582161665, "avg_return": 0.4503542184829712, "regret": 0.35343489050865173, "entropy": 0.13264596462249756, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:08.368113Z", "loop": 1948, "env_steps": 1197465599, "loss": 0.0022686689626425505, "avg_return": 0.4515758454799652, "regret": 0.35343489050865173, "entropy": 0.13377852737903595, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:09.529121Z", "loop": 1949, "env_steps": 1198079999, "loss": 0.002000570297241211, "avg_return": 0.45052146911621094, "regret": 0.35343489050865173, "entropy": 0.13710640370845795, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:10.734586Z", "loop": 1950, "env_steps": 1198694399, "loss": 0.00224410742521286, "avg_return": 0.4511885643005371, "regret": 0.3541131913661957, "entropy": 0.1326877474784851, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:11.895819Z", "loop": 1951, "env_steps": 1199308799, "loss": 0.002077495213598013, "avg_return": 0.45698481798171997, "regret": 0.3541131913661957, "entropy": 0.1270817667245865, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:13.058950Z", "loop": 1952, "env_steps": 1199923199, "loss": 0.002111670095473528, "avg_return": 0.45479461550712585, "regret": 0.3541131913661957, "entropy": 0.1282588541507721, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:14.219566Z", "loop": 1953, "env_steps": 1200537599, "loss": 0.0021003209985792637, "avg_return": 0.4567197263240814, "regret": 0.3541131913661957, "entropy": 0.129560649394989, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:15.379868Z", "loop": 1954, "env_steps": 1201151999, "loss": 0.001930884667672217, "avg_return": 0.453975647687912, "regret": 0.3541131913661957, "entropy": 0.12630735337734222, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:16.585109Z", "loop": 1955, "env_steps": 1201766399, "loss": 0.0020397573243826628, "avg_return": 0.4430079758167267, "regret": 0.35372185707092285, "entropy": 0.12788590788841248, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:17.747471Z", "loop": 1956, "env_steps": 1202380799, "loss": 0.0017002711538225412, "avg_return": 0.4492615759372711, "regret": 0.35372185707092285, "entropy": 0.13248895108699799, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:18.909770Z", "loop": 1957, "env_steps": 1202995199, "loss": 0.001761034713126719, "avg_return": 0.4440547823905945, "regret": 0.35372185707092285, "entropy": 0.13141153752803802, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:20.068625Z", "loop": 1958, "env_steps": 1203609599, "loss": 0.0015837649116292596, "avg_return": 0.4454750120639801, "regret": 0.35372185707092285, "entropy": 0.12573140859603882, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:21.229122Z", "loop": 1959, "env_steps": 1204223999, "loss": 0.001860388438217342, "avg_return": 0.4467296600341797, "regret": 0.35372185707092285, "entropy": 0.12108782678842545, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:22.434069Z", "loop": 1960, "env_steps": 1204838399, "loss": 0.0018508801003918052, "avg_return": 0.44957277178764343, "regret": 0.35397422313690186, "entropy": 0.12767226994037628, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:23.595251Z", "loop": 1961, "env_steps": 1205452799, "loss": 0.0017504303250461817, "avg_return": 0.4514843821525574, "regret": 0.35397422313690186, "entropy": 0.12411432713270187, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:24.755331Z", "loop": 1962, "env_steps": 1206067199, "loss": 0.0017791141290217638, "avg_return": 0.4535564184188843, "regret": 0.35397422313690186, "entropy": 0.12695512175559998, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:25.916298Z", "loop": 1963, "env_steps": 1206681599, "loss": 0.0019703004509210587, "avg_return": 0.4515845477581024, "regret": 0.35397422313690186, "entropy": 0.12177423387765884, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:27.076054Z", "loop": 1964, "env_steps": 1207295999, "loss": 0.0017022278625518084, "avg_return": 0.4411313533782959, "regret": 0.35397422313690186, "entropy": 0.1194402351975441, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:28.280618Z", "loop": 1965, "env_steps": 1207910399, "loss": 0.00204168981872499, "avg_return": 0.4483937621116638, "regret": 0.35266420245170593, "entropy": 0.12715065479278564, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:29.440985Z", "loop": 1966, "env_steps": 1208524799, "loss": 0.0020211029332131147, "avg_return": 0.45441731810569763, "regret": 0.35266420245170593, "entropy": 0.12947110831737518, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:30.603118Z", "loop": 1967, "env_steps": 1209139199, "loss": 0.0021265314426273108, "avg_return": 0.4588019549846649, "regret": 0.35266420245170593, "entropy": 0.12580788135528564, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:31.763746Z", "loop": 1968, "env_steps": 1209753599, "loss": 0.0021357988007366657, "avg_return": 0.4533647298812866, "regret": 0.35266420245170593, "entropy": 0.13065025210380554, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:32.925310Z", "loop": 1969, "env_steps": 1210367999, "loss": 0.0021641100756824017, "avg_return": 0.45859208703041077, "regret": 0.35266420245170593, "entropy": 0.13748928904533386, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:34.134083Z", "loop": 1970, "env_steps": 1210982399, "loss": 0.002294437261298299, "avg_return": 0.44285696744918823, "regret": 0.35178154706954956, "entropy": 0.13625892996788025, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:35.295848Z", "loop": 1971, "env_steps": 1211596799, "loss": 0.002571725519374013, "avg_return": 0.4476584494113922, "regret": 0.35178154706954956, "entropy": 0.1416076123714447, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:36.456940Z", "loop": 1972, "env_steps": 1212211199, "loss": 0.003309995634481311, "avg_return": 0.45345190167427063, "regret": 0.35178154706954956, "entropy": 0.15637175738811493, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:37.617820Z", "loop": 1973, "env_steps": 1212825599, "loss": 0.003802558872848749, "avg_return": 0.4488467574119568, "regret": 0.35178154706954956, "entropy": 0.15842404961585999, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:38.779202Z", "loop": 1974, "env_steps": 1213439999, "loss": 0.0041224961169064045, "avg_return": 0.44827643036842346, "regret": 0.35178154706954956, "entropy": 0.16191965341567993, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:39.985779Z", "loop": 1975, "env_steps": 1214054399, "loss": 0.004353336524218321, "avg_return": 0.45384538173675537, "regret": 0.3530515134334564, "entropy": 0.17755289375782013, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:41.147743Z", "loop": 1976, "env_steps": 1214668799, "loss": 0.004002574365586042, "avg_return": 0.45139309763908386, "regret": 0.3530515134334564, "entropy": 0.17194688320159912, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:42.308864Z", "loop": 1977, "env_steps": 1215283199, "loss": 0.004106440581381321, "avg_return": 0.44647249579429626, "regret": 0.3530515134334564, "entropy": 0.17477408051490784, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:43.469621Z", "loop": 1978, "env_steps": 1215897599, "loss": 0.004012265708297491, "avg_return": 0.45365890860557556, "regret": 0.3530515134334564, "entropy": 0.16870877146720886, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:44.631968Z", "loop": 1979, "env_steps": 1216511999, "loss": 0.003935803659260273, "avg_return": 0.44955119490623474, "regret": 0.3530515134334564, "entropy": 0.1602107137441635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:45.840286Z", "loop": 1980, "env_steps": 1217126399, "loss": 0.0036551491357386112, "avg_return": 0.4499039947986603, "regret": 0.35209500789642334, "entropy": 0.16043516993522644, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:47.001631Z", "loop": 1981, "env_steps": 1217740799, "loss": 0.0037481430917978287, "avg_return": 0.45339295268058777, "regret": 0.35209500789642334, "entropy": 0.156118705868721, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:48.162182Z", "loop": 1982, "env_steps": 1218355199, "loss": 0.003961864858865738, "avg_return": 0.459135502576828, "regret": 0.35209500789642334, "entropy": 0.1523359715938568, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:49.323539Z", "loop": 1983, "env_steps": 1218969599, "loss": 0.003575911046937108, "avg_return": 0.45849162340164185, "regret": 0.35209500789642334, "entropy": 0.15044139325618744, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:50.485530Z", "loop": 1984, "env_steps": 1219583999, "loss": 0.003374530468136072, "avg_return": 0.45812052488327026, "regret": 0.35209500789642334, "entropy": 0.15130102634429932, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:51.694035Z", "loop": 1985, "env_steps": 1220198399, "loss": 0.0032623608130961657, "avg_return": 0.45546966791152954, "regret": 0.35165366530418396, "entropy": 0.14941522479057312, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:52.854478Z", "loop": 1986, "env_steps": 1220812799, "loss": 0.0027188374660909176, "avg_return": 0.44563212990760803, "regret": 0.35165366530418396, "entropy": 0.14245052635669708, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:54.015374Z", "loop": 1987, "env_steps": 1221427199, "loss": 0.002490576123818755, "avg_return": 0.4480392038822174, "regret": 0.35165366530418396, "entropy": 0.13740186393260956, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:55.176037Z", "loop": 1988, "env_steps": 1222041599, "loss": 0.0027161187026649714, "avg_return": 0.45121175050735474, "regret": 0.35165366530418396, "entropy": 0.13680386543273926, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:56.335715Z", "loop": 1989, "env_steps": 1222655999, "loss": 0.0028565300162881613, "avg_return": 0.4572136104106903, "regret": 0.35165366530418396, "entropy": 0.13577818870544434, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:57.541082Z", "loop": 1990, "env_steps": 1223270399, "loss": 0.0025237216614186764, "avg_return": 0.45587819814682007, "regret": 0.3515681028366089, "entropy": 0.1383596509695053, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:58.701935Z", "loop": 1991, "env_steps": 1223884799, "loss": 0.002544720657169819, "avg_return": 0.4521138072013855, "regret": 0.3515681028366089, "entropy": 0.13138611614704132, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:04:59.862001Z", "loop": 1992, "env_steps": 1224499199, "loss": 0.0020922087132930756, "avg_return": 0.45376506447792053, "regret": 0.3515681028366089, "entropy": 0.13082559406757355, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:01.021635Z", "loop": 1993, "env_steps": 1225113599, "loss": 0.001814449205994606, "avg_return": 0.45016413927078247, "regret": 0.3515681028366089, "entropy": 0.13173821568489075, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:02.182554Z", "loop": 1994, "env_steps": 1225727999, "loss": 0.002000456443056464, "avg_return": 0.4537140429019928, "regret": 0.3515681028366089, "entropy": 0.12131616473197937, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:03.389223Z", "loop": 1995, "env_steps": 1226342399, "loss": 0.0018764410633593798, "avg_return": 0.44269371032714844, "regret": 0.3519921898841858, "entropy": 0.12649065256118774, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:04.550371Z", "loop": 1996, "env_steps": 1226956799, "loss": 0.0020487825386226177, "avg_return": 0.45255544781684875, "regret": 0.3519921898841858, "entropy": 0.12314177304506302, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:05.710300Z", "loop": 1997, "env_steps": 1227571199, "loss": 0.0018847136525437236, "avg_return": 0.45894327759742737, "regret": 0.3519921898841858, "entropy": 0.11721266806125641, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:06.871058Z", "loop": 1998, "env_steps": 1228185599, "loss": 0.0019707162864506245, "avg_return": 0.4508070945739746, "regret": 0.3519921898841858, "entropy": 0.12092286348342896, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:08.031999Z", "loop": 1999, "env_steps": 1228799999, "loss": 0.002197865629568696, "avg_return": 0.4573943316936493, "regret": 0.3519921898841858, "entropy": 0.12457585334777832, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:09.236210Z", "loop": 2000, "env_steps": 1229414399, "loss": 0.0025282753631472588, "avg_return": 0.45035097002983093, "regret": 0.35287636518478394, "entropy": 0.1313617080450058, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:10.396233Z", "loop": 2001, "env_steps": 1230028799, "loss": 0.002476105000823736, "avg_return": 0.448413610458374, "regret": 0.35287636518478394, "entropy": 0.12699374556541443, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:11.556427Z", "loop": 2002, "env_steps": 1230643199, "loss": 0.0025634216144680977, "avg_return": 0.44674578309059143, "regret": 0.35287636518478394, "entropy": 0.13431410491466522, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:12.717105Z", "loop": 2003, "env_steps": 1231257599, "loss": 0.0025906809605658054, "avg_return": 0.45060262084007263, "regret": 0.35287636518478394, "entropy": 0.1318279206752777, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:13.876615Z", "loop": 2004, "env_steps": 1231871999, "loss": 0.0023979635443538427, "avg_return": 0.45261770486831665, "regret": 0.35287636518478394, "entropy": 0.12220067530870438, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:15.037455Z", "loop": 2005, "env_steps": 1232486399, "loss": 0.0021821281407028437, "avg_return": 0.4531990587711334, "regret": 0.35287636518478394, "entropy": 0.12543106079101562, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:16.197248Z", "loop": 2006, "env_steps": 1233100799, "loss": 0.0019567457493394613, "avg_return": 0.45913055539131165, "regret": 0.35287636518478394, "entropy": 0.1224011480808258, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:17.357333Z", "loop": 2007, "env_steps": 1233715199, "loss": 0.0020785366650670767, "avg_return": 0.45052215456962585, "regret": 0.35287636518478394, "entropy": 0.11787882447242737, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:18.516783Z", "loop": 2008, "env_steps": 1234329599, "loss": 0.0020377447362989187, "avg_return": 0.4448159337043762, "regret": 0.35287636518478394, "entropy": 0.11813724040985107, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:19.676941Z", "loop": 2009, "env_steps": 1234943999, "loss": 0.0017967353342100978, "avg_return": 0.4559354782104492, "regret": 0.35287636518478394, "entropy": 0.11924660205841064, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:20.884975Z", "loop": 2010, "env_steps": 1235558399, "loss": 0.002003232715651393, "avg_return": 0.44675374031066895, "regret": 0.3515055477619171, "entropy": 0.12597128748893738, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:22.047709Z", "loop": 2011, "env_steps": 1236172799, "loss": 0.0027362650725990534, "avg_return": 0.4495542645454407, "regret": 0.3515055477619171, "entropy": 0.14123490452766418, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:23.208891Z", "loop": 2012, "env_steps": 1236787199, "loss": 0.0028548426926136017, "avg_return": 0.45855817198753357, "regret": 0.3515055477619171, "entropy": 0.1362723410129547, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:24.368794Z", "loop": 2013, "env_steps": 1237401599, "loss": 0.0029488014988601208, "avg_return": 0.44590410590171814, "regret": 0.3515055477619171, "entropy": 0.1378612518310547, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:25.529401Z", "loop": 2014, "env_steps": 1238015999, "loss": 0.003459017025306821, "avg_return": 0.45826423168182373, "regret": 0.3515055477619171, "entropy": 0.14215132594108582, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:26.694035Z", "loop": 2015, "env_steps": 1238630399, "loss": 0.0035975768696516752, "avg_return": 0.4539821445941925, "regret": 0.3515055477619171, "entropy": 0.1434195637702942, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:27.857582Z", "loop": 2016, "env_steps": 1239244799, "loss": 0.003048766404390335, "avg_return": 0.44522684812545776, "regret": 0.3515055477619171, "entropy": 0.14942684769630432, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:29.018172Z", "loop": 2017, "env_steps": 1239859199, "loss": 0.002892708405852318, "avg_return": 0.45251500606536865, "regret": 0.3515055477619171, "entropy": 0.1363043189048767, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:30.178300Z", "loop": 2018, "env_steps": 1240473599, "loss": 0.0027111030649393797, "avg_return": 0.4530962109565735, "regret": 0.3515055477619171, "entropy": 0.13442526757717133, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:31.339536Z", "loop": 2019, "env_steps": 1241087999, "loss": 0.0023349926341325045, "avg_return": 0.44623255729675293, "regret": 0.3515055477619171, "entropy": 0.13405835628509521, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:32.548239Z", "loop": 2020, "env_steps": 1241702399, "loss": 0.002089333487674594, "avg_return": 0.4481429159641266, "regret": 0.35147395730018616, "entropy": 0.12168807536363602, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:33.709129Z", "loop": 2021, "env_steps": 1242316799, "loss": 0.0020440963562577963, "avg_return": 0.4474872946739197, "regret": 0.35147395730018616, "entropy": 0.11988036334514618, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:34.868726Z", "loop": 2022, "env_steps": 1242931199, "loss": 0.002041237661615014, "avg_return": 0.4499102234840393, "regret": 0.35147395730018616, "entropy": 0.1188652291893959, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:36.030117Z", "loop": 2023, "env_steps": 1243545599, "loss": 0.0017390262801200151, "avg_return": 0.4611845016479492, "regret": 0.35147395730018616, "entropy": 0.11883436888456345, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:37.193189Z", "loop": 2024, "env_steps": 1244159999, "loss": 0.001748922630213201, "avg_return": 0.45753052830696106, "regret": 0.35147395730018616, "entropy": 0.11473255604505539, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:38.353462Z", "loop": 2025, "env_steps": 1244774399, "loss": 0.0016136768972501159, "avg_return": 0.4485403597354889, "regret": 0.35147395730018616, "entropy": 0.12341387569904327, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:39.512828Z", "loop": 2026, "env_steps": 1245388799, "loss": 0.0017125230515375733, "avg_return": 0.4503779709339142, "regret": 0.35147395730018616, "entropy": 0.11824905127286911, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:40.672747Z", "loop": 2027, "env_steps": 1246003199, "loss": 0.0018488947534933686, "avg_return": 0.4496479332447052, "regret": 0.35147395730018616, "entropy": 0.11791112273931503, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:41.834961Z", "loop": 2028, "env_steps": 1246617599, "loss": 0.0018028483027592301, "avg_return": 0.4447309374809265, "regret": 0.35147395730018616, "entropy": 0.12398655712604523, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:42.996073Z", "loop": 2029, "env_steps": 1247231999, "loss": 0.002297385362908244, "avg_return": 0.45319193601608276, "regret": 0.35147395730018616, "entropy": 0.11910116672515869, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:44.203275Z", "loop": 2030, "env_steps": 1247846399, "loss": 0.0022826152853667736, "avg_return": 0.450061559677124, "regret": 0.35145509243011475, "entropy": 0.12563258409500122, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:45.363285Z", "loop": 2031, "env_steps": 1248460799, "loss": 0.0021875989623367786, "avg_return": 0.45573458075523376, "regret": 0.35145509243011475, "entropy": 0.13061848282814026, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:46.524999Z", "loop": 2032, "env_steps": 1249075199, "loss": 0.002672299277037382, "avg_return": 0.4490800201892853, "regret": 0.35145509243011475, "entropy": 0.1329556554555893, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:47.685037Z", "loop": 2033, "env_steps": 1249689599, "loss": 0.0031351284123957157, "avg_return": 0.45230862498283386, "regret": 0.35145509243011475, "entropy": 0.13440535962581635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:48.846629Z", "loop": 2034, "env_steps": 1250303999, "loss": 0.003064389107748866, "avg_return": 0.4538954794406891, "regret": 0.35145509243011475, "entropy": 0.1367623656988144, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:50.006783Z", "loop": 2035, "env_steps": 1250918399, "loss": 0.0033922381699085236, "avg_return": 0.4434628486633301, "regret": 0.35145509243011475, "entropy": 0.14162719249725342, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:51.167315Z", "loop": 2036, "env_steps": 1251532799, "loss": 0.0034707654267549515, "avg_return": 0.4484672248363495, "regret": 0.35145509243011475, "entropy": 0.13716696202754974, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:52.328630Z", "loop": 2037, "env_steps": 1252147199, "loss": 0.0043355319648981094, "avg_return": 0.4576115012168884, "regret": 0.35145509243011475, "entropy": 0.1394551396369934, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:53.488467Z", "loop": 2038, "env_steps": 1252761599, "loss": 0.004160958342254162, "avg_return": 0.44899487495422363, "regret": 0.35145509243011475, "entropy": 0.13945922255516052, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:54.649454Z", "loop": 2039, "env_steps": 1253375999, "loss": 0.004164300858974457, "avg_return": 0.4513884484767914, "regret": 0.35145509243011475, "entropy": 0.1400451362133026, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:55.854996Z", "loop": 2040, "env_steps": 1253990399, "loss": 0.004337613005191088, "avg_return": 0.4453014135360718, "regret": 0.35334059596061707, "entropy": 0.13098245859146118, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:57.016364Z", "loop": 2041, "env_steps": 1254604799, "loss": 0.004653220996260643, "avg_return": 0.45306533575057983, "regret": 0.35334059596061707, "entropy": 0.13360783457756042, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:58.177091Z", "loop": 2042, "env_steps": 1255219199, "loss": 0.0045595900155603886, "avg_return": 0.4536422789096832, "regret": 0.35334059596061707, "entropy": 0.12825949490070343, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:05:59.338015Z", "loop": 2043, "env_steps": 1255833599, "loss": 0.0044410075061023235, "avg_return": 0.45334485173225403, "regret": 0.35334059596061707, "entropy": 0.12674541771411896, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:00.501272Z", "loop": 2044, "env_steps": 1256447999, "loss": 0.004936255048960447, "avg_return": 0.4548202157020569, "regret": 0.35334059596061707, "entropy": 0.12703122198581696, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:01.663255Z", "loop": 2045, "env_steps": 1257062399, "loss": 0.003796972334384918, "avg_return": 0.44458842277526855, "regret": 0.35334059596061707, "entropy": 0.12262237817049026, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:02.828420Z", "loop": 2046, "env_steps": 1257676799, "loss": 0.0037537168245762587, "avg_return": 0.45477494597435, "regret": 0.35334059596061707, "entropy": 0.11793043464422226, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:03.994792Z", "loop": 2047, "env_steps": 1258291199, "loss": 0.00347936456091702, "avg_return": 0.44638195633888245, "regret": 0.35334059596061707, "entropy": 0.11918974667787552, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:05.156211Z", "loop": 2048, "env_steps": 1258905599, "loss": 0.0030116632115095854, "avg_return": 0.4618070125579834, "regret": 0.35334059596061707, "entropy": 0.12327031791210175, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:06.318512Z", "loop": 2049, "env_steps": 1259519999, "loss": 0.0027866456657648087, "avg_return": 0.4517487585544586, "regret": 0.35334059596061707, "entropy": 0.12426061928272247, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:07.528804Z", "loop": 2050, "env_steps": 1260134399, "loss": 0.0026895443443208933, "avg_return": 0.44882529973983765, "regret": 0.351979523897171, "entropy": 0.1319306343793869, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:08.690856Z", "loop": 2051, "env_steps": 1260748799, "loss": 0.002690464723855257, "avg_return": 0.450327605009079, "regret": 0.351979523897171, "entropy": 0.1270177811384201, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:09.852342Z", "loop": 2052, "env_steps": 1261363199, "loss": 0.0023644263856112957, "avg_return": 0.455396831035614, "regret": 0.351979523897171, "entropy": 0.11842993646860123, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:11.016412Z", "loop": 2053, "env_steps": 1261977599, "loss": 0.001619914430193603, "avg_return": 0.45165249705314636, "regret": 0.351979523897171, "entropy": 0.11361952126026154, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:12.182850Z", "loop": 2054, "env_steps": 1262591999, "loss": 0.0017303774366155267, "avg_return": 0.4535093307495117, "regret": 0.351979523897171, "entropy": 0.10806220769882202, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:13.344948Z", "loop": 2055, "env_steps": 1263206399, "loss": 0.0015251184813678265, "avg_return": 0.4490680694580078, "regret": 0.351979523897171, "entropy": 0.10765909403562546, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:14.505239Z", "loop": 2056, "env_steps": 1263820799, "loss": 0.00155638565775007, "avg_return": 0.44269582629203796, "regret": 0.351979523897171, "entropy": 0.1071620061993599, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:15.666212Z", "loop": 2057, "env_steps": 1264435199, "loss": 0.0014578532427549362, "avg_return": 0.4510180354118347, "regret": 0.351979523897171, "entropy": 0.10909876227378845, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:16.828336Z", "loop": 2058, "env_steps": 1265049599, "loss": 0.0015818020328879356, "avg_return": 0.4462275803089142, "regret": 0.351979523897171, "entropy": 0.10830982029438019, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:17.989460Z", "loop": 2059, "env_steps": 1265663999, "loss": 0.0016131805023178458, "avg_return": 0.44729411602020264, "regret": 0.351979523897171, "entropy": 0.10717646032571793, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:19.206795Z", "loop": 2060, "env_steps": 1266278399, "loss": 0.0016106375260278583, "avg_return": 0.45101410150527954, "regret": 0.3537449240684509, "entropy": 0.10531174391508102, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:20.370033Z", "loop": 2061, "env_steps": 1266892799, "loss": 0.0017676054267212749, "avg_return": 0.4520074427127838, "regret": 0.3537449240684509, "entropy": 0.10429301857948303, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:21.532583Z", "loop": 2062, "env_steps": 1267507199, "loss": 0.0019175315974280238, "avg_return": 0.45027124881744385, "regret": 0.3537449240684509, "entropy": 0.10653679072856903, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:22.694612Z", "loop": 2063, "env_steps": 1268121599, "loss": 0.001902453019283712, "avg_return": 0.4481268525123596, "regret": 0.3537449240684509, "entropy": 0.1147308498620987, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:23.854727Z", "loop": 2064, "env_steps": 1268735999, "loss": 0.0018964868504554033, "avg_return": 0.44749587774276733, "regret": 0.3537449240684509, "entropy": 0.10985160619020462, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:25.016803Z", "loop": 2065, "env_steps": 1269350399, "loss": 0.0020726853981614113, "avg_return": 0.4516896605491638, "regret": 0.3537449240684509, "entropy": 0.10871326178312302, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:26.181411Z", "loop": 2066, "env_steps": 1269964799, "loss": 0.0020081293769180775, "avg_return": 0.447983056306839, "regret": 0.3537449240684509, "entropy": 0.11715846508741379, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:27.344852Z", "loop": 2067, "env_steps": 1270579199, "loss": 0.0019153676694259048, "avg_return": 0.45000189542770386, "regret": 0.3537449240684509, "entropy": 0.11234927922487259, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:28.509479Z", "loop": 2068, "env_steps": 1271193599, "loss": 0.0017802605871111155, "avg_return": 0.45107895135879517, "regret": 0.3537449240684509, "entropy": 0.11542713642120361, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:29.670868Z", "loop": 2069, "env_steps": 1271807999, "loss": 0.0020472740288823843, "avg_return": 0.4535980224609375, "regret": 0.3537449240684509, "entropy": 0.11031003296375275, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:30.880492Z", "loop": 2070, "env_steps": 1272422399, "loss": 0.002002878114581108, "avg_return": 0.45487356185913086, "regret": 0.3519595265388489, "entropy": 0.10921556502580643, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:32.042223Z", "loop": 2071, "env_steps": 1273036799, "loss": 0.002012285403907299, "avg_return": 0.4514909088611603, "regret": 0.3519595265388489, "entropy": 0.10904228687286377, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:33.204347Z", "loop": 2072, "env_steps": 1273651199, "loss": 0.002078820252791047, "avg_return": 0.4534721076488495, "regret": 0.3519595265388489, "entropy": 0.1175466775894165, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:34.365330Z", "loop": 2073, "env_steps": 1274265599, "loss": 0.002020848449319601, "avg_return": 0.45717862248420715, "regret": 0.3519595265388489, "entropy": 0.11386197805404663, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:35.526366Z", "loop": 2074, "env_steps": 1274879999, "loss": 0.002012789947912097, "avg_return": 0.45689326524734497, "regret": 0.3519595265388489, "entropy": 0.11904345452785492, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:36.686896Z", "loop": 2075, "env_steps": 1275494399, "loss": 0.00236509763635695, "avg_return": 0.4566408395767212, "regret": 0.3519595265388489, "entropy": 0.11789680272340775, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:37.848363Z", "loop": 2076, "env_steps": 1276108799, "loss": 0.0023548367898911238, "avg_return": 0.4514389634132385, "regret": 0.3519595265388489, "entropy": 0.12308603525161743, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:39.011272Z", "loop": 2077, "env_steps": 1276723199, "loss": 0.0028184987604618073, "avg_return": 0.45242026448249817, "regret": 0.3519595265388489, "entropy": 0.13038194179534912, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:40.172017Z", "loop": 2078, "env_steps": 1277337599, "loss": 0.0031148192938417196, "avg_return": 0.4543990194797516, "regret": 0.3519595265388489, "entropy": 0.13667672872543335, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:41.333349Z", "loop": 2079, "env_steps": 1277951999, "loss": 0.0033523831516504288, "avg_return": 0.45189565420150757, "regret": 0.3519595265388489, "entropy": 0.1358761042356491, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:42.538419Z", "loop": 2080, "env_steps": 1278566399, "loss": 0.003592821303755045, "avg_return": 0.44301632046699524, "regret": 0.3527803122997284, "entropy": 0.14059890806674957, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:43.701932Z", "loop": 2081, "env_steps": 1279180799, "loss": 0.004051637835800648, "avg_return": 0.4469250738620758, "regret": 0.3527803122997284, "entropy": 0.13881680369377136, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:44.864469Z", "loop": 2082, "env_steps": 1279795199, "loss": 0.003587892046198249, "avg_return": 0.44933685660362244, "regret": 0.3527803122997284, "entropy": 0.13546960055828094, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:46.029741Z", "loop": 2083, "env_steps": 1280409599, "loss": 0.003957434091717005, "avg_return": 0.44591814279556274, "regret": 0.3527803122997284, "entropy": 0.1396627128124237, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:47.199429Z", "loop": 2084, "env_steps": 1281023999, "loss": 0.0037601336371153593, "avg_return": 0.446506142616272, "regret": 0.3527803122997284, "entropy": 0.13372895121574402, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:48.361213Z", "loop": 2085, "env_steps": 1281638399, "loss": 0.004020240157842636, "avg_return": 0.4460919201374054, "regret": 0.3527803122997284, "entropy": 0.13000577688217163, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:49.524806Z", "loop": 2086, "env_steps": 1282252799, "loss": 0.003680908353999257, "avg_return": 0.45232823491096497, "regret": 0.3527803122997284, "entropy": 0.13365548849105835, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:50.686262Z", "loop": 2087, "env_steps": 1282867199, "loss": 0.0031707596499472857, "avg_return": 0.45574459433555603, "regret": 0.3527803122997284, "entropy": 0.13485324382781982, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:51.846753Z", "loop": 2088, "env_steps": 1283481599, "loss": 0.003116734093055129, "avg_return": 0.4465128779411316, "regret": 0.3527803122997284, "entropy": 0.1271754503250122, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:53.006827Z", "loop": 2089, "env_steps": 1284095999, "loss": 0.0031531036365777254, "avg_return": 0.4510050415992737, "regret": 0.3527803122997284, "entropy": 0.12937484681606293, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:54.213379Z", "loop": 2090, "env_steps": 1284710399, "loss": 0.0027023376896977425, "avg_return": 0.4478888511657715, "regret": 0.35143646597862244, "entropy": 0.12619049847126007, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:55.375418Z", "loop": 2091, "env_steps": 1285324799, "loss": 0.0025281247217208147, "avg_return": 0.44668275117874146, "regret": 0.35143646597862244, "entropy": 0.12503494322299957, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:56.537198Z", "loop": 2092, "env_steps": 1285939199, "loss": 0.002450566738843918, "avg_return": 0.45281338691711426, "regret": 0.35143646597862244, "entropy": 0.11770762503147125, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:57.700046Z", "loop": 2093, "env_steps": 1286553599, "loss": 0.00215627858415246, "avg_return": 0.45243027806282043, "regret": 0.35143646597862244, "entropy": 0.11613566428422928, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:06:58.860635Z", "loop": 2094, "env_steps": 1287167999, "loss": 0.0018488895148038864, "avg_return": 0.44670066237449646, "regret": 0.35143646597862244, "entropy": 0.11358107626438141, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:00.021935Z", "loop": 2095, "env_steps": 1287782399, "loss": 0.0019365446642041206, "avg_return": 0.45404893159866333, "regret": 0.35143646597862244, "entropy": 0.11169983446598053, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:01.185692Z", "loop": 2096, "env_steps": 1288396799, "loss": 0.001905769924633205, "avg_return": 0.4509129524230957, "regret": 0.35143646597862244, "entropy": 0.10520792752504349, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:02.345001Z", "loop": 2097, "env_steps": 1289011199, "loss": 0.0014472076436504722, "avg_return": 0.44629842042922974, "regret": 0.35143646597862244, "entropy": 0.10318480432033539, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:03.510609Z", "loop": 2098, "env_steps": 1289625599, "loss": 0.0017988268518820405, "avg_return": 0.4577220380306244, "regret": 0.35143646597862244, "entropy": 0.10363191366195679, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:04.671494Z", "loop": 2099, "env_steps": 1290239999, "loss": 0.001675805076956749, "avg_return": 0.44556114077568054, "regret": 0.35143646597862244, "entropy": 0.11242931336164474, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:05.882390Z", "loop": 2100, "env_steps": 1290854399, "loss": 0.002197718946263194, "avg_return": 0.4489046335220337, "regret": 0.35441136360168457, "entropy": 0.109944187104702, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:07.043794Z", "loop": 2101, "env_steps": 1291468799, "loss": 0.002523034578189254, "avg_return": 0.4496646225452423, "regret": 0.35441136360168457, "entropy": 0.11646851152181625, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:08.204808Z", "loop": 2102, "env_steps": 1292083199, "loss": 0.002886129543185234, "avg_return": 0.4467427134513855, "regret": 0.35441136360168457, "entropy": 0.12533782422542572, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:09.367112Z", "loop": 2103, "env_steps": 1292697599, "loss": 0.003225464140996337, "avg_return": 0.4423680603504181, "regret": 0.35441136360168457, "entropy": 0.13491448760032654, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:10.528677Z", "loop": 2104, "env_steps": 1293311999, "loss": 0.0031871553510427475, "avg_return": 0.4474586546421051, "regret": 0.35441136360168457, "entropy": 0.13057953119277954, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:11.690720Z", "loop": 2105, "env_steps": 1293926399, "loss": 0.003359969472512603, "avg_return": 0.44571951031684875, "regret": 0.35441136360168457, "entropy": 0.13196322321891785, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:12.850961Z", "loop": 2106, "env_steps": 1294540799, "loss": 0.002735674614086747, "avg_return": 0.4448993504047394, "regret": 0.35441136360168457, "entropy": 0.13195614516735077, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:14.011820Z", "loop": 2107, "env_steps": 1295155199, "loss": 0.0027968487702310085, "avg_return": 0.45019084215164185, "regret": 0.35441136360168457, "entropy": 0.12171977758407593, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:15.171899Z", "loop": 2108, "env_steps": 1295769599, "loss": 0.002566020470112562, "avg_return": 0.4521763324737549, "regret": 0.35441136360168457, "entropy": 0.1155242919921875, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:16.332860Z", "loop": 2109, "env_steps": 1296383999, "loss": 0.001789370900951326, "avg_return": 0.45469728112220764, "regret": 0.35441136360168457, "entropy": 0.10911937803030014, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:17.545633Z", "loop": 2110, "env_steps": 1296998399, "loss": 0.0017918419325724244, "avg_return": 0.44554847478866577, "regret": 0.35274654626846313, "entropy": 0.11111738532781601, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:18.708488Z", "loop": 2111, "env_steps": 1297612799, "loss": 0.0018270250875502825, "avg_return": 0.445252388715744, "regret": 0.35274654626846313, "entropy": 0.10964111238718033, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:19.870629Z", "loop": 2112, "env_steps": 1298227199, "loss": 0.0023094667121767998, "avg_return": 0.45021575689315796, "regret": 0.35274654626846313, "entropy": 0.11619950085878372, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:21.031942Z", "loop": 2113, "env_steps": 1298841599, "loss": 0.0028152649756520987, "avg_return": 0.45472297072410583, "regret": 0.35274654626846313, "entropy": 0.12378456443548203, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:22.192943Z", "loop": 2114, "env_steps": 1299455999, "loss": 0.0023539187386631966, "avg_return": 0.4532604217529297, "regret": 0.35274654626846313, "entropy": 0.12259304523468018, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:23.357396Z", "loop": 2115, "env_steps": 1300070399, "loss": 0.0026870504952967167, "avg_return": 0.4496418237686157, "regret": 0.35274654626846313, "entropy": 0.11860765516757965, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:24.517789Z", "loop": 2116, "env_steps": 1300684799, "loss": 0.002961987629532814, "avg_return": 0.44807419180870056, "regret": 0.35274654626846313, "entropy": 0.11645079404115677, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:25.679290Z", "loop": 2117, "env_steps": 1301299199, "loss": 0.0035518088843673468, "avg_return": 0.44812339544296265, "regret": 0.35274654626846313, "entropy": 0.11293833702802658, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:26.839199Z", "loop": 2118, "env_steps": 1301913599, "loss": 0.004382855258882046, "avg_return": 0.44989192485809326, "regret": 0.35274654626846313, "entropy": 0.12161926180124283, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:27.999897Z", "loop": 2119, "env_steps": 1302527999, "loss": 0.004159192088991404, "avg_return": 0.4487174451351166, "regret": 0.35274654626846313, "entropy": 0.12039867788553238, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:29.213374Z", "loop": 2120, "env_steps": 1303142399, "loss": 0.004131023772060871, "avg_return": 0.43830886483192444, "regret": 0.3562135398387909, "entropy": 0.12069975584745407, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:30.374951Z", "loop": 2121, "env_steps": 1303756799, "loss": 0.003814257448539138, "avg_return": 0.4493636190891266, "regret": 0.3562135398387909, "entropy": 0.11669730395078659, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:31.535468Z", "loop": 2122, "env_steps": 1304371199, "loss": 0.0034016896970570087, "avg_return": 0.44584497809410095, "regret": 0.3562135398387909, "entropy": 0.11684556305408478, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:32.696183Z", "loop": 2123, "env_steps": 1304985599, "loss": 0.0031674837227910757, "avg_return": 0.45428767800331116, "regret": 0.3562135398387909, "entropy": 0.108519047498703, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:33.856105Z", "loop": 2124, "env_steps": 1305599999, "loss": 0.003013751469552517, "avg_return": 0.45596757531166077, "regret": 0.3562135398387909, "entropy": 0.11314672231674194, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:35.017299Z", "loop": 2125, "env_steps": 1306214399, "loss": 0.0027408089954406023, "avg_return": 0.4493487775325775, "regret": 0.3562135398387909, "entropy": 0.11235964298248291, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:36.179345Z", "loop": 2126, "env_steps": 1306828799, "loss": 0.002503177849575877, "avg_return": 0.44898632168769836, "regret": 0.3562135398387909, "entropy": 0.11781372129917145, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:37.339222Z", "loop": 2127, "env_steps": 1307443199, "loss": 0.002580873668193817, "avg_return": 0.4466124176979065, "regret": 0.3562135398387909, "entropy": 0.11818338185548782, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:38.501042Z", "loop": 2128, "env_steps": 1308057599, "loss": 0.0027366436552256346, "avg_return": 0.4513419568538666, "regret": 0.3562135398387909, "entropy": 0.11986508965492249, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:39.661214Z", "loop": 2129, "env_steps": 1308671999, "loss": 0.002759800059720874, "avg_return": 0.45093679428100586, "regret": 0.3562135398387909, "entropy": 0.12168967723846436, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:40.869409Z", "loop": 2130, "env_steps": 1309286399, "loss": 0.0025802336167544127, "avg_return": 0.4522422254085541, "regret": 0.3516462743282318, "entropy": 0.11535203456878662, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:42.032727Z", "loop": 2131, "env_steps": 1309900799, "loss": 0.0023980271071195602, "avg_return": 0.4504220187664032, "regret": 0.3516462743282318, "entropy": 0.12402701377868652, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:43.192881Z", "loop": 2132, "env_steps": 1310515199, "loss": 0.0023970480542629957, "avg_return": 0.4539221227169037, "regret": 0.3516462743282318, "entropy": 0.11944165825843811, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:44.352400Z", "loop": 2133, "env_steps": 1311129599, "loss": 0.00224197912029922, "avg_return": 0.4590018689632416, "regret": 0.3516462743282318, "entropy": 0.1132887601852417, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:45.512666Z", "loop": 2134, "env_steps": 1311743999, "loss": 0.0024204745423048735, "avg_return": 0.44679468870162964, "regret": 0.3516462743282318, "entropy": 0.1188880205154419, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:46.673934Z", "loop": 2135, "env_steps": 1312358399, "loss": 0.0024501297157257795, "avg_return": 0.45379915833473206, "regret": 0.3516462743282318, "entropy": 0.12111032754182816, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:47.834911Z", "loop": 2136, "env_steps": 1312972799, "loss": 0.002725572558119893, "avg_return": 0.4470697045326233, "regret": 0.3516462743282318, "entropy": 0.1261623650789261, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:48.996922Z", "loop": 2137, "env_steps": 1313587199, "loss": 0.0025798992719501257, "avg_return": 0.4490542709827423, "regret": 0.3516462743282318, "entropy": 0.1264248490333557, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:50.157876Z", "loop": 2138, "env_steps": 1314201599, "loss": 0.0027707002591341734, "avg_return": 0.4568749964237213, "regret": 0.3516462743282318, "entropy": 0.11420059949159622, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:51.319650Z", "loop": 2139, "env_steps": 1314815999, "loss": 0.002569640753790736, "avg_return": 0.45471569895744324, "regret": 0.3516462743282318, "entropy": 0.12065408378839493, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:52.533092Z", "loop": 2140, "env_steps": 1315430399, "loss": 0.0027700921054929495, "avg_return": 0.4583316743373871, "regret": 0.35145023465156555, "entropy": 0.11861468106508255, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:53.697867Z", "loop": 2141, "env_steps": 1316044799, "loss": 0.002753043547272682, "avg_return": 0.45162269473075867, "regret": 0.35145023465156555, "entropy": 0.11955643445253372, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:54.859415Z", "loop": 2142, "env_steps": 1316659199, "loss": 0.002809569938108325, "avg_return": 0.45473989844322205, "regret": 0.35145023465156555, "entropy": 0.11704941838979721, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:56.021353Z", "loop": 2143, "env_steps": 1317273599, "loss": 0.0028541572391986847, "avg_return": 0.46091803908348083, "regret": 0.35145023465156555, "entropy": 0.11711138486862183, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:57.184418Z", "loop": 2144, "env_steps": 1317887999, "loss": 0.0027668962720781565, "avg_return": 0.45135498046875, "regret": 0.35145023465156555, "entropy": 0.11780283600091934, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:58.345400Z", "loop": 2145, "env_steps": 1318502399, "loss": 0.0025566366966813803, "avg_return": 0.45148321986198425, "regret": 0.35145023465156555, "entropy": 0.12138618528842926, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:07:59.506348Z", "loop": 2146, "env_steps": 1319116799, "loss": 0.002887439215555787, "avg_return": 0.4562317132949829, "regret": 0.35145023465156555, "entropy": 0.117667555809021, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:00.667781Z", "loop": 2147, "env_steps": 1319731199, "loss": 0.0027407498564571142, "avg_return": 0.4526016414165497, "regret": 0.35145023465156555, "entropy": 0.11618869006633759, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:01.828054Z", "loop": 2148, "env_steps": 1320345599, "loss": 0.0028936872258782387, "avg_return": 0.45489275455474854, "regret": 0.35145023465156555, "entropy": 0.12147340178489685, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:02.990305Z", "loop": 2149, "env_steps": 1320959999, "loss": 0.002847792347893119, "avg_return": 0.4559519588947296, "regret": 0.35145023465156555, "entropy": 0.11795563995838165, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:04.198947Z", "loop": 2150, "env_steps": 1321574399, "loss": 0.0026711176615208387, "avg_return": 0.4548444151878357, "regret": 0.3514310419559479, "entropy": 0.12161016464233398, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:05.360538Z", "loop": 2151, "env_steps": 1322188799, "loss": 0.002700383309274912, "avg_return": 0.45980021357536316, "regret": 0.3514310419559479, "entropy": 0.11594752967357635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:06.521047Z", "loop": 2152, "env_steps": 1322803199, "loss": 0.002251048106700182, "avg_return": 0.45093536376953125, "regret": 0.3514310419559479, "entropy": 0.11519911140203476, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:07.682955Z", "loop": 2153, "env_steps": 1323417599, "loss": 0.002073737559840083, "avg_return": 0.45791956782341003, "regret": 0.3514310419559479, "entropy": 0.11737526953220367, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:08.842759Z", "loop": 2154, "env_steps": 1324031999, "loss": 0.002153894631192088, "avg_return": 0.4526333808898926, "regret": 0.3514310419559479, "entropy": 0.11496119946241379, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:10.002001Z", "loop": 2155, "env_steps": 1324646399, "loss": 0.002312389900907874, "avg_return": 0.4517364203929901, "regret": 0.3514310419559479, "entropy": 0.11096163094043732, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:11.160952Z", "loop": 2156, "env_steps": 1325260799, "loss": 0.0026813435833901167, "avg_return": 0.4491984248161316, "regret": 0.3514310419559479, "entropy": 0.12003711611032486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:12.320350Z", "loop": 2157, "env_steps": 1325875199, "loss": 0.002481981413438916, "avg_return": 0.44413697719573975, "regret": 0.3514310419559479, "entropy": 0.12306959182024002, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:13.480842Z", "loop": 2158, "env_steps": 1326489599, "loss": 0.002582268789410591, "avg_return": 0.45015981793403625, "regret": 0.3514310419559479, "entropy": 0.1199578195810318, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:14.640375Z", "loop": 2159, "env_steps": 1327103999, "loss": 0.0024940429721027613, "avg_return": 0.4452475607395172, "regret": 0.3514310419559479, "entropy": 0.11989366263151169, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:15.844698Z", "loop": 2160, "env_steps": 1327718399, "loss": 0.002570213284343481, "avg_return": 0.45371899008750916, "regret": 0.3515087068080902, "entropy": 0.11369282007217407, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:17.005454Z", "loop": 2161, "env_steps": 1328332799, "loss": 0.0025540299247950315, "avg_return": 0.45135921239852905, "regret": 0.3515087068080902, "entropy": 0.11743230372667313, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:18.166585Z", "loop": 2162, "env_steps": 1328947199, "loss": 0.002472288440912962, "avg_return": 0.45057815313339233, "regret": 0.3515087068080902, "entropy": 0.11529474705457687, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:19.325281Z", "loop": 2163, "env_steps": 1329561599, "loss": 0.0023239976726472378, "avg_return": 0.4499170482158661, "regret": 0.3515087068080902, "entropy": 0.12015081197023392, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:20.485448Z", "loop": 2164, "env_steps": 1330175999, "loss": 0.0026087441947311163, "avg_return": 0.4550474286079407, "regret": 0.3515087068080902, "entropy": 0.1157192811369896, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:21.645362Z", "loop": 2165, "env_steps": 1330790399, "loss": 0.0026870404835790396, "avg_return": 0.44808223843574524, "regret": 0.3515087068080902, "entropy": 0.11854211986064911, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:22.805077Z", "loop": 2166, "env_steps": 1331404799, "loss": 0.002854202641174197, "avg_return": 0.45037877559661865, "regret": 0.3515087068080902, "entropy": 0.11689507961273193, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:23.966916Z", "loop": 2167, "env_steps": 1332019199, "loss": 0.0026252768002450466, "avg_return": 0.44946184754371643, "regret": 0.3515087068080902, "entropy": 0.11084331572055817, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:25.126122Z", "loop": 2168, "env_steps": 1332633599, "loss": 0.003045580117031932, "avg_return": 0.45051485300064087, "regret": 0.3515087068080902, "entropy": 0.11801294982433319, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:26.287754Z", "loop": 2169, "env_steps": 1333247999, "loss": 0.0028463497292250395, "avg_return": 0.45594677329063416, "regret": 0.3515087068080902, "entropy": 0.11644246429204941, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:27.495326Z", "loop": 2170, "env_steps": 1333862399, "loss": 0.0029345396906137466, "avg_return": 0.45003369450569153, "regret": 0.3517778515815735, "entropy": 0.11697127670049667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:28.659390Z", "loop": 2171, "env_steps": 1334476799, "loss": 0.003060300135985017, "avg_return": 0.45587363839149475, "regret": 0.3517778515815735, "entropy": 0.1144912913441658, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:29.819465Z", "loop": 2172, "env_steps": 1335091199, "loss": 0.0029594150837510824, "avg_return": 0.4429362118244171, "regret": 0.3517778515815735, "entropy": 0.1184336245059967, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:30.989145Z", "loop": 2173, "env_steps": 1335705599, "loss": 0.0032500249799340963, "avg_return": 0.4605658948421478, "regret": 0.3517778515815735, "entropy": 0.11109762638807297, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:32.156103Z", "loop": 2174, "env_steps": 1336319999, "loss": 0.003276590257883072, "avg_return": 0.4466557502746582, "regret": 0.3517778515815735, "entropy": 0.11734290421009064, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:33.323301Z", "loop": 2175, "env_steps": 1336934399, "loss": 0.0032268327195197344, "avg_return": 0.4564688205718994, "regret": 0.3517778515815735, "entropy": 0.11069297045469284, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:34.485572Z", "loop": 2176, "env_steps": 1337548799, "loss": 0.0031417941208928823, "avg_return": 0.4589415490627289, "regret": 0.3517778515815735, "entropy": 0.11788351833820343, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:35.645570Z", "loop": 2177, "env_steps": 1338163199, "loss": 0.002913363976404071, "avg_return": 0.44494107365608215, "regret": 0.3517778515815735, "entropy": 0.11105102300643921, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:36.806437Z", "loop": 2178, "env_steps": 1338777599, "loss": 0.0032467034179717302, "avg_return": 0.4488338828086853, "regret": 0.3517778515815735, "entropy": 0.11972812563180923, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:37.967904Z", "loop": 2179, "env_steps": 1339391999, "loss": 0.0035165424924343824, "avg_return": 0.45494547486305237, "regret": 0.3517778515815735, "entropy": 0.12448202073574066, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:39.193411Z", "loop": 2180, "env_steps": 1340006399, "loss": 0.0030307206325232983, "avg_return": 0.4477050304412842, "regret": 0.35228705406188965, "entropy": 0.11709438264369965, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:40.359055Z", "loop": 2181, "env_steps": 1340620799, "loss": 0.0028789485804736614, "avg_return": 0.4517577290534973, "regret": 0.35228705406188965, "entropy": 0.12060628831386566, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:41.521074Z", "loop": 2182, "env_steps": 1341235199, "loss": 0.0031509336549788713, "avg_return": 0.45373621582984924, "regret": 0.35228705406188965, "entropy": 0.11967609077692032, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:42.683518Z", "loop": 2183, "env_steps": 1341849599, "loss": 0.0028559621423482895, "avg_return": 0.45852020382881165, "regret": 0.35228705406188965, "entropy": 0.12000024318695068, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:43.849855Z", "loop": 2184, "env_steps": 1342463999, "loss": 0.0030976030975580215, "avg_return": 0.4514300525188446, "regret": 0.35228705406188965, "entropy": 0.11472705751657486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:45.010984Z", "loop": 2185, "env_steps": 1343078399, "loss": 0.002727136015892029, "avg_return": 0.4486985504627228, "regret": 0.35228705406188965, "entropy": 0.12694387137889862, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:46.171337Z", "loop": 2186, "env_steps": 1343692799, "loss": 0.00271093868650496, "avg_return": 0.4520386755466461, "regret": 0.35228705406188965, "entropy": 0.12094218283891678, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:47.330769Z", "loop": 2187, "env_steps": 1344307199, "loss": 0.0023265534546226263, "avg_return": 0.45152679085731506, "regret": 0.35228705406188965, "entropy": 0.11617475003004074, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:48.491837Z", "loop": 2188, "env_steps": 1344921599, "loss": 0.002309245290234685, "avg_return": 0.4528227746486664, "regret": 0.35228705406188965, "entropy": 0.12104609608650208, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:49.653179Z", "loop": 2189, "env_steps": 1345535999, "loss": 0.0025043783243745565, "avg_return": 0.4506341516971588, "regret": 0.35228705406188965, "entropy": 0.1173786073923111, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:50.867998Z", "loop": 2190, "env_steps": 1346150399, "loss": 0.002632003277540207, "avg_return": 0.454609751701355, "regret": 0.35139909386634827, "entropy": 0.11783003807067871, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:52.032198Z", "loop": 2191, "env_steps": 1346764799, "loss": 0.0022905475925654173, "avg_return": 0.44878092408180237, "regret": 0.35139909386634827, "entropy": 0.11370449513196945, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:53.192657Z", "loop": 2192, "env_steps": 1347379199, "loss": 0.002273155376315117, "avg_return": 0.4464288353919983, "regret": 0.35139909386634827, "entropy": 0.11188864707946777, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:54.354261Z", "loop": 2193, "env_steps": 1347993599, "loss": 0.002098250202834606, "avg_return": 0.4505936801433563, "regret": 0.35139909386634827, "entropy": 0.10164107382297516, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:55.514493Z", "loop": 2194, "env_steps": 1348607999, "loss": 0.0018752965843304992, "avg_return": 0.4510903060436249, "regret": 0.35139909386634827, "entropy": 0.10568995028734207, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:56.674663Z", "loop": 2195, "env_steps": 1349222399, "loss": 0.001866934821009636, "avg_return": 0.4456920623779297, "regret": 0.35139909386634827, "entropy": 0.10796884447336197, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:57.836798Z", "loop": 2196, "env_steps": 1349836799, "loss": 0.0021156813018023968, "avg_return": 0.4583798348903656, "regret": 0.35139909386634827, "entropy": 0.10489577054977417, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:08:58.997040Z", "loop": 2197, "env_steps": 1350451199, "loss": 0.0024279518984258175, "avg_return": 0.4481692612171173, "regret": 0.35139909386634827, "entropy": 0.10742699354887009, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:00.158971Z", "loop": 2198, "env_steps": 1351065599, "loss": 0.0025236119981855154, "avg_return": 0.4511480927467346, "regret": 0.35139909386634827, "entropy": 0.11083324998617172, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:01.320823Z", "loop": 2199, "env_steps": 1351679999, "loss": 0.0027842880226671696, "avg_return": 0.4492805600166321, "regret": 0.35139909386634827, "entropy": 0.11716776341199875, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:02.533686Z", "loop": 2200, "env_steps": 1352294399, "loss": 0.0027209098916500807, "avg_return": 0.4506825804710388, "regret": 0.3535948097705841, "entropy": 0.11129813641309738, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:03.696655Z", "loop": 2201, "env_steps": 1352908799, "loss": 0.0029850744176656008, "avg_return": 0.44949841499328613, "regret": 0.3535948097705841, "entropy": 0.11672578752040863, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:04.859408Z", "loop": 2202, "env_steps": 1353523199, "loss": 0.002650790149345994, "avg_return": 0.4484230577945709, "regret": 0.3535948097705841, "entropy": 0.11704947054386139, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:06.026570Z", "loop": 2203, "env_steps": 1354137599, "loss": 0.002516315318644047, "avg_return": 0.4540015161037445, "regret": 0.3535948097705841, "entropy": 0.11181604862213135, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:07.187242Z", "loop": 2204, "env_steps": 1354751999, "loss": 0.0025608644355088472, "avg_return": 0.45028483867645264, "regret": 0.3535948097705841, "entropy": 0.1117892786860466, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:08.348827Z", "loop": 2205, "env_steps": 1355366399, "loss": 0.002430071821436286, "avg_return": 0.4467887878417969, "regret": 0.3535948097705841, "entropy": 0.11226832121610641, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:09.508774Z", "loop": 2206, "env_steps": 1355980799, "loss": 0.0027516386471688747, "avg_return": 0.4568994343280792, "regret": 0.3535948097705841, "entropy": 0.11546070128679276, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:10.670398Z", "loop": 2207, "env_steps": 1356595199, "loss": 0.003132810816168785, "avg_return": 0.4530319273471832, "regret": 0.3535948097705841, "entropy": 0.1132100448012352, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:11.832301Z", "loop": 2208, "env_steps": 1357209599, "loss": 0.0030525345355272293, "avg_return": 0.45218583941459656, "regret": 0.3535948097705841, "entropy": 0.11363091319799423, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:12.993655Z", "loop": 2209, "env_steps": 1357823999, "loss": 0.0026707814540714025, "avg_return": 0.448337197303772, "regret": 0.3535948097705841, "entropy": 0.1160695031285286, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:14.202196Z", "loop": 2210, "env_steps": 1358438399, "loss": 0.0022185274865478277, "avg_return": 0.4535146653652191, "regret": 0.351703017950058, "entropy": 0.11155559867620468, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:15.363977Z", "loop": 2211, "env_steps": 1359052799, "loss": 0.0020699743181467056, "avg_return": 0.44731780886650085, "regret": 0.351703017950058, "entropy": 0.10443122684955597, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:16.525611Z", "loop": 2212, "env_steps": 1359667199, "loss": 0.0019745323807001114, "avg_return": 0.45324447751045227, "regret": 0.351703017950058, "entropy": 0.10720175504684448, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:17.685748Z", "loop": 2213, "env_steps": 1360281599, "loss": 0.0019023333443328738, "avg_return": 0.4509936571121216, "regret": 0.351703017950058, "entropy": 0.11251867562532425, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:18.847119Z", "loop": 2214, "env_steps": 1360895999, "loss": 0.002254347549751401, "avg_return": 0.45480892062187195, "regret": 0.351703017950058, "entropy": 0.11090700328350067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:20.012809Z", "loop": 2215, "env_steps": 1361510399, "loss": 0.0025311352219432592, "avg_return": 0.45533397793769836, "regret": 0.351703017950058, "entropy": 0.12398774921894073, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:21.174239Z", "loop": 2216, "env_steps": 1362124799, "loss": 0.0027467573527246714, "avg_return": 0.45359817147254944, "regret": 0.351703017950058, "entropy": 0.12716098129749298, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:22.335556Z", "loop": 2217, "env_steps": 1362739199, "loss": 0.0028846156783401966, "avg_return": 0.4497825801372528, "regret": 0.351703017950058, "entropy": 0.13014571368694305, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:23.496329Z", "loop": 2218, "env_steps": 1363353599, "loss": 0.002976273884996772, "avg_return": 0.4463880956172943, "regret": 0.351703017950058, "entropy": 0.12958787381649017, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:24.659902Z", "loop": 2219, "env_steps": 1363967999, "loss": 0.003636430250480771, "avg_return": 0.46200358867645264, "regret": 0.351703017950058, "entropy": 0.13094112277030945, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:25.869115Z", "loop": 2220, "env_steps": 1364582399, "loss": 0.0034351092763245106, "avg_return": 0.4480021893978119, "regret": 0.352703332901001, "entropy": 0.12930889427661896, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:27.032052Z", "loop": 2221, "env_steps": 1365196799, "loss": 0.00309556070715189, "avg_return": 0.4453183114528656, "regret": 0.352703332901001, "entropy": 0.1243315041065216, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:28.193844Z", "loop": 2222, "env_steps": 1365811199, "loss": 0.0033462406136095524, "avg_return": 0.4485473334789276, "regret": 0.352703332901001, "entropy": 0.12407641112804413, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:29.354214Z", "loop": 2223, "env_steps": 1366425599, "loss": 0.0034992084838449955, "avg_return": 0.4540986716747284, "regret": 0.352703332901001, "entropy": 0.11868714541196823, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:30.514934Z", "loop": 2224, "env_steps": 1367039999, "loss": 0.003141472116112709, "avg_return": 0.4529764950275421, "regret": 0.352703332901001, "entropy": 0.12194384634494781, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:31.676442Z", "loop": 2225, "env_steps": 1367654399, "loss": 0.0026339890900999308, "avg_return": 0.4505782723426819, "regret": 0.352703332901001, "entropy": 0.12244335561990738, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:32.837704Z", "loop": 2226, "env_steps": 1368268799, "loss": 0.002770826919004321, "avg_return": 0.4514065682888031, "regret": 0.352703332901001, "entropy": 0.12549203634262085, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:33.998638Z", "loop": 2227, "env_steps": 1368883199, "loss": 0.002828756347298622, "avg_return": 0.45634767413139343, "regret": 0.352703332901001, "entropy": 0.12262625247240067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:35.159368Z", "loop": 2228, "env_steps": 1369497599, "loss": 0.0029724480118602514, "avg_return": 0.45391562581062317, "regret": 0.352703332901001, "entropy": 0.12479189038276672, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:36.319447Z", "loop": 2229, "env_steps": 1370111999, "loss": 0.0025207323487848043, "avg_return": 0.44929760694503784, "regret": 0.352703332901001, "entropy": 0.1257372349500656, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:37.529218Z", "loop": 2230, "env_steps": 1370726399, "loss": 0.0029960039537400007, "avg_return": 0.4510655701160431, "regret": 0.351550430059433, "entropy": 0.12336116284132004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:38.695472Z", "loop": 2231, "env_steps": 1371340799, "loss": 0.0026186411269009113, "avg_return": 0.45120394229888916, "regret": 0.351550430059433, "entropy": 0.12407836318016052, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:39.856095Z", "loop": 2232, "env_steps": 1371955199, "loss": 0.0029437525663524866, "avg_return": 0.446677565574646, "regret": 0.351550430059433, "entropy": 0.13088952004909515, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:41.017785Z", "loop": 2233, "env_steps": 1372569599, "loss": 0.002473743399605155, "avg_return": 0.4525776207447052, "regret": 0.351550430059433, "entropy": 0.12362505495548248, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:42.178516Z", "loop": 2234, "env_steps": 1373183999, "loss": 0.0029027618002146482, "avg_return": 0.4557262659072876, "regret": 0.351550430059433, "entropy": 0.12458553910255432, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:43.340944Z", "loop": 2235, "env_steps": 1373798399, "loss": 0.002721836557611823, "avg_return": 0.451575368642807, "regret": 0.351550430059433, "entropy": 0.12288056313991547, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:44.500867Z", "loop": 2236, "env_steps": 1374412799, "loss": 0.0026954880449920893, "avg_return": 0.4536801874637604, "regret": 0.351550430059433, "entropy": 0.11687012016773224, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:45.662243Z", "loop": 2237, "env_steps": 1375027199, "loss": 0.002786164404824376, "avg_return": 0.4514714777469635, "regret": 0.351550430059433, "entropy": 0.11981123685836792, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:46.827861Z", "loop": 2238, "env_steps": 1375641599, "loss": 0.0023018268402665854, "avg_return": 0.44966813921928406, "regret": 0.351550430059433, "entropy": 0.11985092610120773, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:47.989151Z", "loop": 2239, "env_steps": 1376255999, "loss": 0.0020393095910549164, "avg_return": 0.45432332158088684, "regret": 0.351550430059433, "entropy": 0.11504244804382324, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:49.201462Z", "loop": 2240, "env_steps": 1376870399, "loss": 0.001977174310013652, "avg_return": 0.44621899724006653, "regret": 0.3512552082538605, "entropy": 0.10667198151350021, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:50.362484Z", "loop": 2241, "env_steps": 1377484799, "loss": 0.0020977419335395098, "avg_return": 0.4472653269767761, "regret": 0.3512552082538605, "entropy": 0.11165441572666168, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:51.523955Z", "loop": 2242, "env_steps": 1378099199, "loss": 0.0017774797743186355, "avg_return": 0.4444190561771393, "regret": 0.3512552082538605, "entropy": 0.11111032217741013, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:52.685933Z", "loop": 2243, "env_steps": 1378713599, "loss": 0.0019470517290756106, "avg_return": 0.45892611145973206, "regret": 0.3512552082538605, "entropy": 0.10696598887443542, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:53.848537Z", "loop": 2244, "env_steps": 1379327999, "loss": 0.0022544313687831163, "avg_return": 0.4440830647945404, "regret": 0.3512552082538605, "entropy": 0.11293245106935501, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:55.011516Z", "loop": 2245, "env_steps": 1379942399, "loss": 0.0024366036523133516, "avg_return": 0.45340728759765625, "regret": 0.3512552082538605, "entropy": 0.11831584572792053, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:56.173014Z", "loop": 2246, "env_steps": 1380556799, "loss": 0.0023641688749194145, "avg_return": 0.4550565779209137, "regret": 0.3512552082538605, "entropy": 0.11690369248390198, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:57.335331Z", "loop": 2247, "env_steps": 1381171199, "loss": 0.0026016475167125463, "avg_return": 0.4527125060558319, "regret": 0.3512552082538605, "entropy": 0.1195714995265007, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:58.496062Z", "loop": 2248, "env_steps": 1381785599, "loss": 0.0024497429840266705, "avg_return": 0.44650065898895264, "regret": 0.3512552082538605, "entropy": 0.1161491796374321, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:09:59.657063Z", "loop": 2249, "env_steps": 1382399999, "loss": 0.002415698254480958, "avg_return": 0.4495681822299957, "regret": 0.3512552082538605, "entropy": 0.1183280274271965, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:00.864304Z", "loop": 2250, "env_steps": 1383014399, "loss": 0.002730936510488391, "avg_return": 0.44423797726631165, "regret": 0.35177043080329895, "entropy": 0.11844507604837418, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:02.024691Z", "loop": 2251, "env_steps": 1383628799, "loss": 0.0025327166076749563, "avg_return": 0.45202821493148804, "regret": 0.35177043080329895, "entropy": 0.11701441556215286, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:03.184045Z", "loop": 2252, "env_steps": 1384243199, "loss": 0.0027030492201447487, "avg_return": 0.45777085423469543, "regret": 0.35177043080329895, "entropy": 0.11416181176900864, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:04.343704Z", "loop": 2253, "env_steps": 1384857599, "loss": 0.002881541382521391, "avg_return": 0.4561771750450134, "regret": 0.35177043080329895, "entropy": 0.11353699862957001, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:05.503816Z", "loop": 2254, "env_steps": 1385471999, "loss": 0.003121901536360383, "avg_return": 0.4557218551635742, "regret": 0.35177043080329895, "entropy": 0.11487463861703873, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:06.663365Z", "loop": 2255, "env_steps": 1386086399, "loss": 0.0028449518140405416, "avg_return": 0.45651522278785706, "regret": 0.35177043080329895, "entropy": 0.1251320093870163, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:07.823860Z", "loop": 2256, "env_steps": 1386700799, "loss": 0.0024413294158875942, "avg_return": 0.4547138512134552, "regret": 0.35177043080329895, "entropy": 0.11506271362304688, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:08.982758Z", "loop": 2257, "env_steps": 1387315199, "loss": 0.002423250814899802, "avg_return": 0.4499145746231079, "regret": 0.35177043080329895, "entropy": 0.11255655437707901, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:10.144188Z", "loop": 2258, "env_steps": 1387929599, "loss": 0.0024370769970119, "avg_return": 0.45749542117118835, "regret": 0.35177043080329895, "entropy": 0.10926803201436996, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:11.303472Z", "loop": 2259, "env_steps": 1388543999, "loss": 0.0022872856352478266, "avg_return": 0.45200520753860474, "regret": 0.35177043080329895, "entropy": 0.11621669679880142, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:12.507833Z", "loop": 2260, "env_steps": 1389158399, "loss": 0.002678847638890147, "avg_return": 0.4577312469482422, "regret": 0.35122910141944885, "entropy": 0.11548691987991333, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:13.669416Z", "loop": 2261, "env_steps": 1389772799, "loss": 0.002195381559431553, "avg_return": 0.4527977705001831, "regret": 0.35122910141944885, "entropy": 0.11002829670906067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:14.830349Z", "loop": 2262, "env_steps": 1390387199, "loss": 0.002018008381128311, "avg_return": 0.4536144733428955, "regret": 0.35122910141944885, "entropy": 0.10560969263315201, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:15.989037Z", "loop": 2263, "env_steps": 1391001599, "loss": 0.0019066029926761985, "avg_return": 0.44619014859199524, "regret": 0.35122910141944885, "entropy": 0.1033986285328865, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:17.148437Z", "loop": 2264, "env_steps": 1391615999, "loss": 0.0017108211759477854, "avg_return": 0.4535404443740845, "regret": 0.35122910141944885, "entropy": 0.10993003100156784, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:18.308897Z", "loop": 2265, "env_steps": 1392230399, "loss": 0.0022604293189942837, "avg_return": 0.45040395855903625, "regret": 0.35122910141944885, "entropy": 0.10903983563184738, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:19.469015Z", "loop": 2266, "env_steps": 1392844799, "loss": 0.002961481222882867, "avg_return": 0.45769360661506653, "regret": 0.35122910141944885, "entropy": 0.11757949739694595, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:20.631442Z", "loop": 2267, "env_steps": 1393459199, "loss": 0.0024866347666829824, "avg_return": 0.4494633078575134, "regret": 0.35122910141944885, "entropy": 0.11915862560272217, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:21.791449Z", "loop": 2268, "env_steps": 1394073599, "loss": 0.002957965014502406, "avg_return": 0.4494500756263733, "regret": 0.35122910141944885, "entropy": 0.11526214331388474, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:22.951329Z", "loop": 2269, "env_steps": 1394687999, "loss": 0.0027497478295117617, "avg_return": 0.45251527428627014, "regret": 0.35122910141944885, "entropy": 0.12184692174196243, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:24.157154Z", "loop": 2270, "env_steps": 1395302399, "loss": 0.0028293041978031397, "avg_return": 0.44140830636024475, "regret": 0.3533434569835663, "entropy": 0.12493094801902771, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:25.317509Z", "loop": 2271, "env_steps": 1395916799, "loss": 0.002670577960088849, "avg_return": 0.4497690796852112, "regret": 0.3533434569835663, "entropy": 0.11660079658031464, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:26.476249Z", "loop": 2272, "env_steps": 1396531199, "loss": 0.0028988178819417953, "avg_return": 0.4596433639526367, "regret": 0.3533434569835663, "entropy": 0.11636859178543091, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:27.635955Z", "loop": 2273, "env_steps": 1397145599, "loss": 0.0029122165869921446, "avg_return": 0.45178690552711487, "regret": 0.3533434569835663, "entropy": 0.11944960057735443, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:28.795235Z", "loop": 2274, "env_steps": 1397759999, "loss": 0.0026410433929413557, "avg_return": 0.4492819309234619, "regret": 0.3533434569835663, "entropy": 0.11530888080596924, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:29.956820Z", "loop": 2275, "env_steps": 1398374399, "loss": 0.0025035685393959284, "avg_return": 0.44680339097976685, "regret": 0.3533434569835663, "entropy": 0.11902590095996857, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:31.120824Z", "loop": 2276, "env_steps": 1398988799, "loss": 0.0022585010156035423, "avg_return": 0.4567945897579193, "regret": 0.3533434569835663, "entropy": 0.11353784054517746, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:32.280098Z", "loop": 2277, "env_steps": 1399603199, "loss": 0.0026092820335179567, "avg_return": 0.4553564190864563, "regret": 0.3533434569835663, "entropy": 0.11421872675418854, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:33.442489Z", "loop": 2278, "env_steps": 1400217599, "loss": 0.0025790887884795666, "avg_return": 0.44840389490127563, "regret": 0.3533434569835663, "entropy": 0.10958301275968552, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:34.608111Z", "loop": 2279, "env_steps": 1400831999, "loss": 0.002823200775310397, "avg_return": 0.4575226306915283, "regret": 0.3533434569835663, "entropy": 0.11278020590543747, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:35.825793Z", "loop": 2280, "env_steps": 1401446399, "loss": 0.0026783093344420195, "avg_return": 0.46048253774642944, "regret": 0.35176509618759155, "entropy": 0.11325019598007202, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:36.996628Z", "loop": 2281, "env_steps": 1402060799, "loss": 0.002484445460140705, "avg_return": 0.4534885287284851, "regret": 0.35176509618759155, "entropy": 0.11119270324707031, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:38.155806Z", "loop": 2282, "env_steps": 1402675199, "loss": 0.002616641577333212, "avg_return": 0.44735679030418396, "regret": 0.35176509618759155, "entropy": 0.11110012233257294, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:39.317393Z", "loop": 2283, "env_steps": 1403289599, "loss": 0.0024683091323822737, "avg_return": 0.44927695393562317, "regret": 0.35176509618759155, "entropy": 0.11843763291835785, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:40.478209Z", "loop": 2284, "env_steps": 1403903999, "loss": 0.002090655965730548, "avg_return": 0.4499906003475189, "regret": 0.35176509618759155, "entropy": 0.11166706681251526, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:41.639403Z", "loop": 2285, "env_steps": 1404518399, "loss": 0.0022167363204061985, "avg_return": 0.4590889513492584, "regret": 0.35176509618759155, "entropy": 0.10657566785812378, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:42.800936Z", "loop": 2286, "env_steps": 1405132799, "loss": 0.0022656007204204798, "avg_return": 0.45334675908088684, "regret": 0.35176509618759155, "entropy": 0.11311831325292587, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:43.961107Z", "loop": 2287, "env_steps": 1405747199, "loss": 0.001866595121100545, "avg_return": 0.4560944139957428, "regret": 0.35176509618759155, "entropy": 0.11141156405210495, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:45.122040Z", "loop": 2288, "env_steps": 1406361599, "loss": 0.002024017972871661, "avg_return": 0.4504218101501465, "regret": 0.35176509618759155, "entropy": 0.10735200345516205, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:46.281878Z", "loop": 2289, "env_steps": 1406975999, "loss": 0.0022030207328498363, "avg_return": 0.4511352777481079, "regret": 0.35176509618759155, "entropy": 0.11965741217136383, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:47.488289Z", "loop": 2290, "env_steps": 1407590399, "loss": 0.0024542936589568853, "avg_return": 0.44886669516563416, "regret": 0.3511050045490265, "entropy": 0.12009680271148682, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:48.647811Z", "loop": 2291, "env_steps": 1408204799, "loss": 0.002729327417910099, "avg_return": 0.44709306955337524, "regret": 0.3511050045490265, "entropy": 0.11923923343420029, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:49.809423Z", "loop": 2292, "env_steps": 1408819199, "loss": 0.0027760653756558895, "avg_return": 0.45583730936050415, "regret": 0.3511050045490265, "entropy": 0.12050699442625046, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:50.970284Z", "loop": 2293, "env_steps": 1409433599, "loss": 0.0026196304243057966, "avg_return": 0.4456472396850586, "regret": 0.3511050045490265, "entropy": 0.12308717519044876, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:52.131955Z", "loop": 2294, "env_steps": 1410047999, "loss": 0.0028032087720930576, "avg_return": 0.4531914293766022, "regret": 0.3511050045490265, "entropy": 0.11931031197309494, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:53.293937Z", "loop": 2295, "env_steps": 1410662399, "loss": 0.002709930529817939, "avg_return": 0.4567308723926544, "regret": 0.3511050045490265, "entropy": 0.11908794194459915, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:54.454081Z", "loop": 2296, "env_steps": 1411276799, "loss": 0.0031624098774045706, "avg_return": 0.4495706260204315, "regret": 0.3511050045490265, "entropy": 0.12046533823013306, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:55.614692Z", "loop": 2297, "env_steps": 1411891199, "loss": 0.003288848325610161, "avg_return": 0.4515998363494873, "regret": 0.3511050045490265, "entropy": 0.12040933966636658, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:56.774645Z", "loop": 2298, "env_steps": 1412505599, "loss": 0.003287883475422859, "avg_return": 0.4493764340877533, "regret": 0.3511050045490265, "entropy": 0.11692321300506592, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:57.934558Z", "loop": 2299, "env_steps": 1413119999, "loss": 0.0036963508464396, "avg_return": 0.4575783312320709, "regret": 0.3511050045490265, "entropy": 0.11246205121278763, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:10:59.140534Z", "loop": 2300, "env_steps": 1413734399, "loss": 0.0036856525111943483, "avg_return": 0.44477999210357666, "regret": 0.3546040654182434, "entropy": 0.1172172799706459, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:00.310654Z", "loop": 2301, "env_steps": 1414348799, "loss": 0.003604208817705512, "avg_return": 0.45024019479751587, "regret": 0.3546040654182434, "entropy": 0.11651791632175446, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:01.473315Z", "loop": 2302, "env_steps": 1414963199, "loss": 0.0036065310705453157, "avg_return": 0.4494091272354126, "regret": 0.3546040654182434, "entropy": 0.11270240694284439, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:02.633757Z", "loop": 2303, "env_steps": 1415577599, "loss": 0.003939156886190176, "avg_return": 0.45332804322242737, "regret": 0.3546040654182434, "entropy": 0.10864460468292236, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:03.795084Z", "loop": 2304, "env_steps": 1416191999, "loss": 0.0037392990197986364, "avg_return": 0.44524243474006653, "regret": 0.3546040654182434, "entropy": 0.11040020734071732, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:04.955415Z", "loop": 2305, "env_steps": 1416806399, "loss": 0.003927983809262514, "avg_return": 0.44443878531455994, "regret": 0.3546040654182434, "entropy": 0.11043575406074524, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:06.120407Z", "loop": 2306, "env_steps": 1417420799, "loss": 0.0038112164475023746, "avg_return": 0.4509306848049164, "regret": 0.3546040654182434, "entropy": 0.10590918362140656, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:07.286998Z", "loop": 2307, "env_steps": 1418035199, "loss": 0.003748507471755147, "avg_return": 0.4538443684577942, "regret": 0.3546040654182434, "entropy": 0.11069048941135406, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:08.448664Z", "loop": 2308, "env_steps": 1418649599, "loss": 0.0033050731290131807, "avg_return": 0.44716471433639526, "regret": 0.3546040654182434, "entropy": 0.10916280001401901, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:09.610001Z", "loop": 2309, "env_steps": 1419263999, "loss": 0.0031592051964253187, "avg_return": 0.44877585768699646, "regret": 0.3546040654182434, "entropy": 0.10358618944883347, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:10.818240Z", "loop": 2310, "env_steps": 1419878399, "loss": 0.00288952374830842, "avg_return": 0.45245561003685, "regret": 0.35246962308883667, "entropy": 0.10722187906503677, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:11.985653Z", "loop": 2311, "env_steps": 1420492799, "loss": 0.0030715034808963537, "avg_return": 0.4573540985584259, "regret": 0.35246962308883667, "entropy": 0.10306815057992935, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:13.146326Z", "loop": 2312, "env_steps": 1421107199, "loss": 0.002772342413663864, "avg_return": 0.45380401611328125, "regret": 0.35246962308883667, "entropy": 0.10466582328081131, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:14.312878Z", "loop": 2313, "env_steps": 1421721599, "loss": 0.0021759825758635998, "avg_return": 0.44426360726356506, "regret": 0.35246962308883667, "entropy": 0.10379219800233841, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:15.475151Z", "loop": 2314, "env_steps": 1422335999, "loss": 0.002308394992724061, "avg_return": 0.4487941563129425, "regret": 0.35246962308883667, "entropy": 0.09668536484241486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:16.636824Z", "loop": 2315, "env_steps": 1422950399, "loss": 0.002317541278898716, "avg_return": 0.45476746559143066, "regret": 0.35246962308883667, "entropy": 0.09552046656608582, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:17.804629Z", "loop": 2316, "env_steps": 1423564799, "loss": 0.0021586609072983265, "avg_return": 0.45185720920562744, "regret": 0.35246962308883667, "entropy": 0.1002407893538475, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:18.964274Z", "loop": 2317, "env_steps": 1424179199, "loss": 0.0020141403656452894, "avg_return": 0.45169878005981445, "regret": 0.35246962308883667, "entropy": 0.09899389743804932, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:20.124951Z", "loop": 2318, "env_steps": 1424793599, "loss": 0.002090390305966139, "avg_return": 0.4523211717605591, "regret": 0.35246962308883667, "entropy": 0.09752584248781204, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:21.284751Z", "loop": 2319, "env_steps": 1425407999, "loss": 0.002111834241077304, "avg_return": 0.4523950219154358, "regret": 0.35246962308883667, "entropy": 0.10328641533851624, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:22.497777Z", "loop": 2320, "env_steps": 1426022399, "loss": 0.0018920404836535454, "avg_return": 0.458019882440567, "regret": 0.3521144986152649, "entropy": 0.09261232614517212, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:23.664179Z", "loop": 2321, "env_steps": 1426636799, "loss": 0.001966128358617425, "avg_return": 0.4534187316894531, "regret": 0.3521144986152649, "entropy": 0.09608474373817444, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:24.826478Z", "loop": 2322, "env_steps": 1427251199, "loss": 0.0018801449332386255, "avg_return": 0.441394567489624, "regret": 0.3521144986152649, "entropy": 0.10245568305253983, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:25.988945Z", "loop": 2323, "env_steps": 1427865599, "loss": 0.0019163064425811172, "avg_return": 0.45144322514533997, "regret": 0.3521144986152649, "entropy": 0.09780305624008179, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:27.149496Z", "loop": 2324, "env_steps": 1428479999, "loss": 0.001985154114663601, "avg_return": 0.4495164453983307, "regret": 0.3521144986152649, "entropy": 0.09410715103149414, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:28.311559Z", "loop": 2325, "env_steps": 1429094399, "loss": 0.0020063358824700117, "avg_return": 0.4571155309677124, "regret": 0.3521144986152649, "entropy": 0.09657742083072662, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:29.474708Z", "loop": 2326, "env_steps": 1429708799, "loss": 0.002003251574933529, "avg_return": 0.4513123631477356, "regret": 0.3521144986152649, "entropy": 0.09720151871442795, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:30.634115Z", "loop": 2327, "env_steps": 1430323199, "loss": 0.001871496089734137, "avg_return": 0.4501371383666992, "regret": 0.3521144986152649, "entropy": 0.09956932812929153, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:31.795675Z", "loop": 2328, "env_steps": 1430937599, "loss": 0.001715641119517386, "avg_return": 0.4508861303329468, "regret": 0.3521144986152649, "entropy": 0.10423330962657928, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:32.956202Z", "loop": 2329, "env_steps": 1431551999, "loss": 0.0021173341665416956, "avg_return": 0.45091187953948975, "regret": 0.3521144986152649, "entropy": 0.10242073237895966, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:34.164388Z", "loop": 2330, "env_steps": 1432166399, "loss": 0.002215668326243758, "avg_return": 0.4582902193069458, "regret": 0.3527089059352875, "entropy": 0.10212119668722153, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:35.323445Z", "loop": 2331, "env_steps": 1432780799, "loss": 0.0017178867710754275, "avg_return": 0.44827210903167725, "regret": 0.3527089059352875, "entropy": 0.09771415591239929, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:36.484427Z", "loop": 2332, "env_steps": 1433395199, "loss": 0.0018602794734761119, "avg_return": 0.44776302576065063, "regret": 0.3527089059352875, "entropy": 0.09799283742904663, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:37.643749Z", "loop": 2333, "env_steps": 1434009599, "loss": 0.0020123410504311323, "avg_return": 0.45030665397644043, "regret": 0.3527089059352875, "entropy": 0.0963243693113327, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:38.804949Z", "loop": 2334, "env_steps": 1434623999, "loss": 0.0018209246918559074, "avg_return": 0.4508901536464691, "regret": 0.3527089059352875, "entropy": 0.10033291578292847, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:39.965110Z", "loop": 2335, "env_steps": 1435238399, "loss": 0.0016802639001980424, "avg_return": 0.4559895992279053, "regret": 0.3527089059352875, "entropy": 0.09257224947214127, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:41.125511Z", "loop": 2336, "env_steps": 1435852799, "loss": 0.0016867200611159205, "avg_return": 0.4547949433326721, "regret": 0.3527089059352875, "entropy": 0.10364815592765808, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:42.286255Z", "loop": 2337, "env_steps": 1436467199, "loss": 0.0017568323528394103, "avg_return": 0.456189900636673, "regret": 0.3527089059352875, "entropy": 0.10095865279436111, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:43.445671Z", "loop": 2338, "env_steps": 1437081599, "loss": 0.0019181432435289025, "avg_return": 0.46000662446022034, "regret": 0.3527089059352875, "entropy": 0.0978226587176323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:44.606680Z", "loop": 2339, "env_steps": 1437695999, "loss": 0.001725209760479629, "avg_return": 0.44826823472976685, "regret": 0.3527089059352875, "entropy": 0.09821825474500656, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:45.814880Z", "loop": 2340, "env_steps": 1438310399, "loss": 0.0018393726786598563, "avg_return": 0.45125874876976013, "regret": 0.35229796171188354, "entropy": 0.1023302972316742, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:46.977344Z", "loop": 2341, "env_steps": 1438924799, "loss": 0.0018003362929448485, "avg_return": 0.44907069206237793, "regret": 0.35229796171188354, "entropy": 0.10134495794773102, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:48.139086Z", "loop": 2342, "env_steps": 1439539199, "loss": 0.001987290335819125, "avg_return": 0.4547663629055023, "regret": 0.35229796171188354, "entropy": 0.10053781419992447, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:49.300892Z", "loop": 2343, "env_steps": 1440153599, "loss": 0.002022214001044631, "avg_return": 0.4501364231109619, "regret": 0.35229796171188354, "entropy": 0.10272112488746643, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:50.460984Z", "loop": 2344, "env_steps": 1440767999, "loss": 0.0021007710602134466, "avg_return": 0.4579734802246094, "regret": 0.35229796171188354, "entropy": 0.10227498412132263, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:51.622004Z", "loop": 2345, "env_steps": 1441382399, "loss": 0.0021569975651800632, "avg_return": 0.44585293531417847, "regret": 0.35229796171188354, "entropy": 0.10602038353681564, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:52.783878Z", "loop": 2346, "env_steps": 1441996799, "loss": 0.0021770643070340157, "avg_return": 0.45413702726364136, "regret": 0.35229796171188354, "entropy": 0.10904021561145782, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:53.943705Z", "loop": 2347, "env_steps": 1442611199, "loss": 0.0018949148943647742, "avg_return": 0.45267629623413086, "regret": 0.35229796171188354, "entropy": 0.10815013200044632, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:55.104335Z", "loop": 2348, "env_steps": 1443225599, "loss": 0.0019373024115338922, "avg_return": 0.44707417488098145, "regret": 0.35229796171188354, "entropy": 0.1058759093284607, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:56.263920Z", "loop": 2349, "env_steps": 1443839999, "loss": 0.0020459420047700405, "avg_return": 0.4503629803657532, "regret": 0.35229796171188354, "entropy": 0.10227979719638824, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:57.474284Z", "loop": 2350, "env_steps": 1444454399, "loss": 0.0020749762188643217, "avg_return": 0.4497060179710388, "regret": 0.35126256942749023, "entropy": 0.10250222682952881, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:58.637083Z", "loop": 2351, "env_steps": 1445068799, "loss": 0.002675672760233283, "avg_return": 0.44716283679008484, "regret": 0.35126256942749023, "entropy": 0.094185009598732, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:11:59.800766Z", "loop": 2352, "env_steps": 1445683199, "loss": 0.0025051624979823828, "avg_return": 0.45221060514450073, "regret": 0.35126256942749023, "entropy": 0.0990852639079094, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:00.960247Z", "loop": 2353, "env_steps": 1446297599, "loss": 0.0030269843991845846, "avg_return": 0.4486237168312073, "regret": 0.35126256942749023, "entropy": 0.10490456223487854, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:02.122597Z", "loop": 2354, "env_steps": 1446911999, "loss": 0.0032861405052244663, "avg_return": 0.4549938142299652, "regret": 0.35126256942749023, "entropy": 0.10069020837545395, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:03.285329Z", "loop": 2355, "env_steps": 1447526399, "loss": 0.003733657766133547, "avg_return": 0.45678824186325073, "regret": 0.35126256942749023, "entropy": 0.10657516121864319, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:04.444928Z", "loop": 2356, "env_steps": 1448140799, "loss": 0.0036253866273909807, "avg_return": 0.4543617367744446, "regret": 0.35126256942749023, "entropy": 0.10378169268369675, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:05.606296Z", "loop": 2357, "env_steps": 1448755199, "loss": 0.003425822826102376, "avg_return": 0.4575640857219696, "regret": 0.35126256942749023, "entropy": 0.10302161425352097, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:06.766403Z", "loop": 2358, "env_steps": 1449369599, "loss": 0.0036240704357624054, "avg_return": 0.4557429552078247, "regret": 0.35126256942749023, "entropy": 0.113401398062706, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:07.926570Z", "loop": 2359, "env_steps": 1449983999, "loss": 0.0036820550449192524, "avg_return": 0.4533448815345764, "regret": 0.35126256942749023, "entropy": 0.11345578730106354, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:09.137070Z", "loop": 2360, "env_steps": 1450598399, "loss": 0.0034610701259225607, "avg_return": 0.449925035238266, "regret": 0.35210537910461426, "entropy": 0.10655338317155838, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:10.299440Z", "loop": 2361, "env_steps": 1451212799, "loss": 0.0031154153402894735, "avg_return": 0.4512955844402313, "regret": 0.35210537910461426, "entropy": 0.11368928104639053, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:11.461436Z", "loop": 2362, "env_steps": 1451827199, "loss": 0.0027859013061970472, "avg_return": 0.454782634973526, "regret": 0.35210537910461426, "entropy": 0.10604898631572723, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:12.622310Z", "loop": 2363, "env_steps": 1452441599, "loss": 0.0022899555042386055, "avg_return": 0.4531121850013733, "regret": 0.35210537910461426, "entropy": 0.1084555983543396, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:13.784981Z", "loop": 2364, "env_steps": 1453055999, "loss": 0.0022682154085487127, "avg_return": 0.4490070343017578, "regret": 0.35210537910461426, "entropy": 0.1032489463686943, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:14.944482Z", "loop": 2365, "env_steps": 1453670399, "loss": 0.0025680772960186005, "avg_return": 0.4501241147518158, "regret": 0.35210537910461426, "entropy": 0.10748674720525742, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:16.104721Z", "loop": 2366, "env_steps": 1454284799, "loss": 0.0021625529043376446, "avg_return": 0.45230937004089355, "regret": 0.35210537910461426, "entropy": 0.11104501783847809, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:17.265196Z", "loop": 2367, "env_steps": 1454899199, "loss": 0.002155756577849388, "avg_return": 0.45421600341796875, "regret": 0.35210537910461426, "entropy": 0.10486213862895966, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:18.425894Z", "loop": 2368, "env_steps": 1455513599, "loss": 0.0019553143065422773, "avg_return": 0.4518395960330963, "regret": 0.35210537910461426, "entropy": 0.09877680987119675, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:19.586706Z", "loop": 2369, "env_steps": 1456127999, "loss": 0.0016409879317507148, "avg_return": 0.45216137170791626, "regret": 0.35210537910461426, "entropy": 0.10081679373979568, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:20.790800Z", "loop": 2370, "env_steps": 1456742399, "loss": 0.0015857787802815437, "avg_return": 0.4499228894710541, "regret": 0.3511514365673065, "entropy": 0.10177683085203171, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:21.957931Z", "loop": 2371, "env_steps": 1457356799, "loss": 0.0016970158321782947, "avg_return": 0.4534960687160492, "regret": 0.3511514365673065, "entropy": 0.09309902787208557, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:23.118876Z", "loop": 2372, "env_steps": 1457971199, "loss": 0.001634374144487083, "avg_return": 0.4484500288963318, "regret": 0.3511514365673065, "entropy": 0.10180915147066116, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:24.281260Z", "loop": 2373, "env_steps": 1458585599, "loss": 0.002252802951261401, "avg_return": 0.4480724632740021, "regret": 0.3511514365673065, "entropy": 0.10544264316558838, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:25.442620Z", "loop": 2374, "env_steps": 1459199999, "loss": 0.0027684883680194616, "avg_return": 0.4577704966068268, "regret": 0.3511514365673065, "entropy": 0.10898251831531525, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:26.604419Z", "loop": 2375, "env_steps": 1459814399, "loss": 0.0034215424675494432, "avg_return": 0.4505176544189453, "regret": 0.3511514365673065, "entropy": 0.12103761732578278, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:27.765470Z", "loop": 2376, "env_steps": 1460428799, "loss": 0.0031468586530536413, "avg_return": 0.4438008666038513, "regret": 0.3511514365673065, "entropy": 0.11184724420309067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:28.927190Z", "loop": 2377, "env_steps": 1461043199, "loss": 0.0030606219079345465, "avg_return": 0.44633811712265015, "regret": 0.3511514365673065, "entropy": 0.10053908079862595, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:30.089598Z", "loop": 2378, "env_steps": 1461657599, "loss": 0.003240204183384776, "avg_return": 0.43906280398368835, "regret": 0.3511514365673065, "entropy": 0.09987254440784454, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:31.250053Z", "loop": 2379, "env_steps": 1462271999, "loss": 0.002663158578798175, "avg_return": 0.4456755816936493, "regret": 0.3511514365673065, "entropy": 0.10791205614805222, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:32.456299Z", "loop": 2380, "env_steps": 1462886399, "loss": 0.002419119467958808, "avg_return": 0.4567257761955261, "regret": 0.35516151785850525, "entropy": 0.10467632114887238, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:33.617476Z", "loop": 2381, "env_steps": 1463500799, "loss": 0.003121227491647005, "avg_return": 0.4544065594673157, "regret": 0.35516151785850525, "entropy": 0.11723194271326065, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:34.777739Z", "loop": 2382, "env_steps": 1464115199, "loss": 0.0032097292132675648, "avg_return": 0.4551926851272583, "regret": 0.35516151785850525, "entropy": 0.12266886234283447, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:35.937276Z", "loop": 2383, "env_steps": 1464729599, "loss": 0.0028689641039818525, "avg_return": 0.44949808716773987, "regret": 0.35516151785850525, "entropy": 0.1275598108768463, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:37.096368Z", "loop": 2384, "env_steps": 1465343999, "loss": 0.0026712226681411266, "avg_return": 0.44802820682525635, "regret": 0.35516151785850525, "entropy": 0.11788070201873779, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:38.255596Z", "loop": 2385, "env_steps": 1465958399, "loss": 0.0019793084356933832, "avg_return": 0.45311108231544495, "regret": 0.35516151785850525, "entropy": 0.10908249765634537, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:39.414862Z", "loop": 2386, "env_steps": 1466572799, "loss": 0.0017310196999460459, "avg_return": 0.4504515826702118, "regret": 0.35516151785850525, "entropy": 0.11553943157196045, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:40.574717Z", "loop": 2387, "env_steps": 1467187199, "loss": 0.0018762057879939675, "avg_return": 0.4496642053127289, "regret": 0.35516151785850525, "entropy": 0.10706035792827606, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:41.733839Z", "loop": 2388, "env_steps": 1467801599, "loss": 0.0017777284374460578, "avg_return": 0.4518652558326721, "regret": 0.35516151785850525, "entropy": 0.11162011325359344, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:42.894385Z", "loop": 2389, "env_steps": 1468415999, "loss": 0.0016523459926247597, "avg_return": 0.4521154761314392, "regret": 0.35516151785850525, "entropy": 0.1116042211651802, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:44.096873Z", "loop": 2390, "env_steps": 1469030399, "loss": 0.0017641913145780563, "avg_return": 0.45010462403297424, "regret": 0.351131796836853, "entropy": 0.11427447944879532, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:45.257557Z", "loop": 2391, "env_steps": 1469644799, "loss": 0.0018533881520852447, "avg_return": 0.4514857232570648, "regret": 0.351131796836853, "entropy": 0.11265541613101959, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:46.417300Z", "loop": 2392, "env_steps": 1470259199, "loss": 0.0018749472219496965, "avg_return": 0.4549218416213989, "regret": 0.351131796836853, "entropy": 0.12166876345872879, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:47.577339Z", "loop": 2393, "env_steps": 1470873599, "loss": 0.002151662018150091, "avg_return": 0.4512821435928345, "regret": 0.351131796836853, "entropy": 0.11967537552118301, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:48.736766Z", "loop": 2394, "env_steps": 1471487999, "loss": 0.002323511755093932, "avg_return": 0.451162725687027, "regret": 0.351131796836853, "entropy": 0.1165916845202446, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:49.897527Z", "loop": 2395, "env_steps": 1472102399, "loss": 0.0022800450678914785, "avg_return": 0.4548282027244568, "regret": 0.351131796836853, "entropy": 0.11329985409975052, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:51.056882Z", "loop": 2396, "env_steps": 1472716799, "loss": 0.0022028270177543163, "avg_return": 0.44704470038414, "regret": 0.351131796836853, "entropy": 0.12182069569826126, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:52.216627Z", "loop": 2397, "env_steps": 1473331199, "loss": 0.002524918643757701, "avg_return": 0.4557746946811676, "regret": 0.351131796836853, "entropy": 0.11430367082357407, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:53.375634Z", "loop": 2398, "env_steps": 1473945599, "loss": 0.0023324103094637394, "avg_return": 0.4469009041786194, "regret": 0.351131796836853, "entropy": 0.11210248619318008, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:54.536112Z", "loop": 2399, "env_steps": 1474559999, "loss": 0.0026939474046230316, "avg_return": 0.45185354351997375, "regret": 0.351131796836853, "entropy": 0.11440301686525345, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:55.741323Z", "loop": 2400, "env_steps": 1475174399, "loss": 0.0025072211865335703, "avg_return": 0.4495885372161865, "regret": 0.3520744740962982, "entropy": 0.11364689469337463, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:56.901867Z", "loop": 2401, "env_steps": 1475788799, "loss": 0.0023929947055876255, "avg_return": 0.44424840807914734, "regret": 0.3520744740962982, "entropy": 0.11000503599643707, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:58.061973Z", "loop": 2402, "env_steps": 1476403199, "loss": 0.0023361791390925646, "avg_return": 0.4504551291465759, "regret": 0.3520744740962982, "entropy": 0.11625906080007553, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:12:59.222489Z", "loop": 2403, "env_steps": 1477017599, "loss": 0.0022322461009025574, "avg_return": 0.4482440948486328, "regret": 0.3520744740962982, "entropy": 0.11114219576120377, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:00.387190Z", "loop": 2404, "env_steps": 1477631999, "loss": 0.0019132249290123582, "avg_return": 0.4528292417526245, "regret": 0.3520744740962982, "entropy": 0.10517774522304535, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:01.553459Z", "loop": 2405, "env_steps": 1478246399, "loss": 0.0020904960110783577, "avg_return": 0.4540213644504547, "regret": 0.3520744740962982, "entropy": 0.11216812580823898, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:02.713862Z", "loop": 2406, "env_steps": 1478860799, "loss": 0.0016008879756554961, "avg_return": 0.4587486982345581, "regret": 0.3520744740962982, "entropy": 0.10581380873918533, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:03.872986Z", "loop": 2407, "env_steps": 1479475199, "loss": 0.0017887449357658625, "avg_return": 0.4556974470615387, "regret": 0.3520744740962982, "entropy": 0.10301196575164795, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:05.033119Z", "loop": 2408, "env_steps": 1480089599, "loss": 0.0020494672935456038, "avg_return": 0.4539538323879242, "regret": 0.3520744740962982, "entropy": 0.113772913813591, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:06.194145Z", "loop": 2409, "env_steps": 1480703999, "loss": 0.0023834898602217436, "avg_return": 0.4487895965576172, "regret": 0.3520744740962982, "entropy": 0.12726081907749176, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:07.398476Z", "loop": 2410, "env_steps": 1481318399, "loss": 0.0031518451869487762, "avg_return": 0.4536103308200836, "regret": 0.3519975543022156, "entropy": 0.13126260042190552, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:08.560036Z", "loop": 2411, "env_steps": 1481932799, "loss": 0.0031380050349980593, "avg_return": 0.45706889033317566, "regret": 0.3519975543022156, "entropy": 0.13549721240997314, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:09.720552Z", "loop": 2412, "env_steps": 1482547199, "loss": 0.0029243852477520704, "avg_return": 0.44940629601478577, "regret": 0.3519975543022156, "entropy": 0.13666373491287231, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:10.881041Z", "loop": 2413, "env_steps": 1483161599, "loss": 0.002858091378584504, "avg_return": 0.44838106632232666, "regret": 0.3519975543022156, "entropy": 0.12141026556491852, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:12.040649Z", "loop": 2414, "env_steps": 1483775999, "loss": 0.002599831437692046, "avg_return": 0.4553428292274475, "regret": 0.3519975543022156, "entropy": 0.11903812736272812, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:13.202214Z", "loop": 2415, "env_steps": 1484390399, "loss": 0.0023261168971657753, "avg_return": 0.4531860947608948, "regret": 0.3519975543022156, "entropy": 0.11148464679718018, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:14.367068Z", "loop": 2416, "env_steps": 1485004799, "loss": 0.0020344576332718134, "avg_return": 0.4448617100715637, "regret": 0.3519975543022156, "entropy": 0.11101984232664108, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:15.527303Z", "loop": 2417, "env_steps": 1485619199, "loss": 0.002060087164863944, "avg_return": 0.44196468591690063, "regret": 0.3519975543022156, "entropy": 0.10519447922706604, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:16.689187Z", "loop": 2418, "env_steps": 1486233599, "loss": 0.0017612975789234042, "avg_return": 0.4438367784023285, "regret": 0.3519975543022156, "entropy": 0.10726691037416458, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:17.848686Z", "loop": 2419, "env_steps": 1486847999, "loss": 0.0021811395417898893, "avg_return": 0.4512447714805603, "regret": 0.3519975543022156, "entropy": 0.10065829753875732, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:19.056620Z", "loop": 2420, "env_steps": 1487462399, "loss": 0.0016975060570985079, "avg_return": 0.4426155686378479, "regret": 0.35457220673561096, "entropy": 0.1101033091545105, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:20.218343Z", "loop": 2421, "env_steps": 1488076799, "loss": 0.0020055414643138647, "avg_return": 0.44900545477867126, "regret": 0.35457220673561096, "entropy": 0.10921216756105423, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:21.380162Z", "loop": 2422, "env_steps": 1488691199, "loss": 0.002108258893713355, "avg_return": 0.4531056880950928, "regret": 0.35457220673561096, "entropy": 0.11069565266370773, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:22.540788Z", "loop": 2423, "env_steps": 1489305599, "loss": 0.0023106816224753857, "avg_return": 0.4457559287548065, "regret": 0.35457220673561096, "entropy": 0.11411404609680176, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:23.702544Z", "loop": 2424, "env_steps": 1489919999, "loss": 0.0025978265330195427, "avg_return": 0.45336151123046875, "regret": 0.35457220673561096, "entropy": 0.11027778685092926, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:24.864763Z", "loop": 2425, "env_steps": 1490534399, "loss": 0.0025865703355520964, "avg_return": 0.45334169268608093, "regret": 0.35457220673561096, "entropy": 0.115557961165905, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:26.025184Z", "loop": 2426, "env_steps": 1491148799, "loss": 0.00264250417239964, "avg_return": 0.44809165596961975, "regret": 0.35457220673561096, "entropy": 0.11276847869157791, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:27.186366Z", "loop": 2427, "env_steps": 1491763199, "loss": 0.0021383981220424175, "avg_return": 0.4432370066642761, "regret": 0.35457220673561096, "entropy": 0.1099543422460556, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:28.346624Z", "loop": 2428, "env_steps": 1492377599, "loss": 0.0021384682040661573, "avg_return": 0.4500734508037567, "regret": 0.35457220673561096, "entropy": 0.11130144447088242, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:29.507592Z", "loop": 2429, "env_steps": 1492991999, "loss": 0.002603336237370968, "avg_return": 0.458976149559021, "regret": 0.35457220673561096, "entropy": 0.10968820750713348, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:30.713406Z", "loop": 2430, "env_steps": 1493606399, "loss": 0.002744566649198532, "avg_return": 0.4604041278362274, "regret": 0.35249677300453186, "entropy": 0.10963719338178635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:31.874290Z", "loop": 2431, "env_steps": 1494220799, "loss": 0.0021920728031545877, "avg_return": 0.45595836639404297, "regret": 0.35249677300453186, "entropy": 0.11243108659982681, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:33.034450Z", "loop": 2432, "env_steps": 1494835199, "loss": 0.0022449439857155085, "avg_return": 0.44832301139831543, "regret": 0.35249677300453186, "entropy": 0.10941965132951736, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:34.195485Z", "loop": 2433, "env_steps": 1495449599, "loss": 0.002122564008459449, "avg_return": 0.44938671588897705, "regret": 0.35249677300453186, "entropy": 0.10815945267677307, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:35.355421Z", "loop": 2434, "env_steps": 1496063999, "loss": 0.0022510250564664602, "avg_return": 0.453443706035614, "regret": 0.35249677300453186, "entropy": 0.11239264160394669, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:36.515937Z", "loop": 2435, "env_steps": 1496678399, "loss": 0.0022408326622098684, "avg_return": 0.4502611458301544, "regret": 0.35249677300453186, "entropy": 0.10929039865732193, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:37.677268Z", "loop": 2436, "env_steps": 1497292799, "loss": 0.002120778663083911, "avg_return": 0.44919729232788086, "regret": 0.35249677300453186, "entropy": 0.11074990779161453, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:38.837978Z", "loop": 2437, "env_steps": 1497907199, "loss": 0.0024002015125006437, "avg_return": 0.4531938135623932, "regret": 0.35249677300453186, "entropy": 0.1133493185043335, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:39.999708Z", "loop": 2438, "env_steps": 1498521599, "loss": 0.0024037256371229887, "avg_return": 0.44904398918151855, "regret": 0.35249677300453186, "entropy": 0.11079179495573044, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:41.159794Z", "loop": 2439, "env_steps": 1499135999, "loss": 0.0024349733721464872, "avg_return": 0.448212593793869, "regret": 0.35249677300453186, "entropy": 0.11881964653730392, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:42.365915Z", "loop": 2440, "env_steps": 1499750399, "loss": 0.002584986388683319, "avg_return": 0.45609980821609497, "regret": 0.3517150282859802, "entropy": 0.10978570580482483, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:43.525823Z", "loop": 2441, "env_steps": 1500364799, "loss": 0.0027012915816158056, "avg_return": 0.447289377450943, "regret": 0.3517150282859802, "entropy": 0.12261798232793808, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:44.687073Z", "loop": 2442, "env_steps": 1500979199, "loss": 0.0027768395375460386, "avg_return": 0.4525085985660553, "regret": 0.3517150282859802, "entropy": 0.11561848968267441, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:45.846725Z", "loop": 2443, "env_steps": 1501593599, "loss": 0.0028547595720738173, "avg_return": 0.4522612690925598, "regret": 0.3517150282859802, "entropy": 0.12323082983493805, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:47.007188Z", "loop": 2444, "env_steps": 1502207999, "loss": 0.0028645405545830727, "avg_return": 0.4496314227581024, "regret": 0.3517150282859802, "entropy": 0.11850579082965851, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:48.166833Z", "loop": 2445, "env_steps": 1502822399, "loss": 0.0029878844507038593, "avg_return": 0.451442688703537, "regret": 0.3517150282859802, "entropy": 0.12739403545856476, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:49.326839Z", "loop": 2446, "env_steps": 1503436799, "loss": 0.0027794414199888706, "avg_return": 0.4419548511505127, "regret": 0.3517150282859802, "entropy": 0.12344174832105637, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:50.487758Z", "loop": 2447, "env_steps": 1504051199, "loss": 0.0029516303911805153, "avg_return": 0.44143834710121155, "regret": 0.3517150282859802, "entropy": 0.11732272058725357, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:51.647666Z", "loop": 2448, "env_steps": 1504665599, "loss": 0.0027134218253195286, "avg_return": 0.4548363983631134, "regret": 0.3517150282859802, "entropy": 0.1192636713385582, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:52.808616Z", "loop": 2449, "env_steps": 1505279999, "loss": 0.0027542980387806892, "avg_return": 0.45469656586647034, "regret": 0.3517150282859802, "entropy": 0.11096687614917755, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:54.014290Z", "loop": 2450, "env_steps": 1505894399, "loss": 0.0025159253273159266, "avg_return": 0.4502814710140228, "regret": 0.3523278534412384, "entropy": 0.11150379478931427, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:55.175505Z", "loop": 2451, "env_steps": 1506508799, "loss": 0.002413076115772128, "avg_return": 0.45358195900917053, "regret": 0.3523278534412384, "entropy": 0.10818678885698318, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:56.335213Z", "loop": 2452, "env_steps": 1507123199, "loss": 0.0022736494429409504, "avg_return": 0.44752687215805054, "regret": 0.3523278534412384, "entropy": 0.10461347550153732, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:57.496198Z", "loop": 2453, "env_steps": 1507737599, "loss": 0.0021597135346382856, "avg_return": 0.4495139718055725, "regret": 0.3523278534412384, "entropy": 0.09702827781438828, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:58.655936Z", "loop": 2454, "env_steps": 1508351999, "loss": 0.0020398336928337812, "avg_return": 0.449079304933548, "regret": 0.3523278534412384, "entropy": 0.09273257851600647, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:13:59.816346Z", "loop": 2455, "env_steps": 1508966399, "loss": 0.0020680546294897795, "avg_return": 0.43792182207107544, "regret": 0.3523278534412384, "entropy": 0.10024061053991318, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:00.978029Z", "loop": 2456, "env_steps": 1509580799, "loss": 0.002261905698105693, "avg_return": 0.4457465708255768, "regret": 0.3523278534412384, "entropy": 0.10492527484893799, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:02.138493Z", "loop": 2457, "env_steps": 1510195199, "loss": 0.002027274575084448, "avg_return": 0.4560377597808838, "regret": 0.3523278534412384, "entropy": 0.09680385887622833, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:03.299683Z", "loop": 2458, "env_steps": 1510809599, "loss": 0.0022707327734678984, "avg_return": 0.459104984998703, "regret": 0.3523278534412384, "entropy": 0.09566443413496017, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:04.459475Z", "loop": 2459, "env_steps": 1511423999, "loss": 0.0024960082955658436, "avg_return": 0.45793724060058594, "regret": 0.3523278534412384, "entropy": 0.1040540412068367, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:05.673130Z", "loop": 2460, "env_steps": 1512038399, "loss": 0.002634223084896803, "avg_return": 0.44431138038635254, "regret": 0.353727787733078, "entropy": 0.10908157378435135, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:06.833965Z", "loop": 2461, "env_steps": 1512652799, "loss": 0.0026319604367017746, "avg_return": 0.44337892532348633, "regret": 0.353727787733078, "entropy": 0.11828572303056717, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:07.995339Z", "loop": 2462, "env_steps": 1513267199, "loss": 0.0029835246969014406, "avg_return": 0.4431709945201874, "regret": 0.353727787733078, "entropy": 0.12314696609973907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:09.155337Z", "loop": 2463, "env_steps": 1513881599, "loss": 0.0032814263831824064, "avg_return": 0.45181208848953247, "regret": 0.353727787733078, "entropy": 0.13197819888591766, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:10.316449Z", "loop": 2464, "env_steps": 1514495999, "loss": 0.003547385800629854, "avg_return": 0.4512683153152466, "regret": 0.353727787733078, "entropy": 0.1361013948917389, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:11.477717Z", "loop": 2465, "env_steps": 1515110399, "loss": 0.0035612047649919987, "avg_return": 0.4495185315608978, "regret": 0.353727787733078, "entropy": 0.13999761641025543, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:12.637728Z", "loop": 2466, "env_steps": 1515724799, "loss": 0.0035693214740604162, "avg_return": 0.453119158744812, "regret": 0.353727787733078, "entropy": 0.13049989938735962, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:13.798908Z", "loop": 2467, "env_steps": 1516339199, "loss": 0.0029928775038570166, "avg_return": 0.4544101059436798, "regret": 0.353727787733078, "entropy": 0.12408063560724258, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:14.959255Z", "loop": 2468, "env_steps": 1516953599, "loss": 0.0025729527696967125, "avg_return": 0.4477806091308594, "regret": 0.353727787733078, "entropy": 0.11572249233722687, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:16.121057Z", "loop": 2469, "env_steps": 1517567999, "loss": 0.002562753390520811, "avg_return": 0.4518817663192749, "regret": 0.353727787733078, "entropy": 0.1199033260345459, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:17.329170Z", "loop": 2470, "env_steps": 1518182399, "loss": 0.002557543106377125, "avg_return": 0.4508138597011566, "regret": 0.35153084993362427, "entropy": 0.10855360329151154, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:18.491310Z", "loop": 2471, "env_steps": 1518796799, "loss": 0.0027342052198946476, "avg_return": 0.453956663608551, "regret": 0.35153084993362427, "entropy": 0.11691707372665405, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:19.650903Z", "loop": 2472, "env_steps": 1519411199, "loss": 0.0030532802920788527, "avg_return": 0.4501568078994751, "regret": 0.35153084993362427, "entropy": 0.12505167722702026, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:20.811035Z", "loop": 2473, "env_steps": 1520025599, "loss": 0.0030349534936249256, "avg_return": 0.45822134613990784, "regret": 0.35153084993362427, "entropy": 0.12545572221279144, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:21.971530Z", "loop": 2474, "env_steps": 1520639999, "loss": 0.003328651189804077, "avg_return": 0.45366308093070984, "regret": 0.35153084993362427, "entropy": 0.12887710332870483, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:23.131168Z", "loop": 2475, "env_steps": 1521254399, "loss": 0.003205176442861557, "avg_return": 0.44963541626930237, "regret": 0.35153084993362427, "entropy": 0.13285720348358154, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:24.292719Z", "loop": 2476, "env_steps": 1521868799, "loss": 0.0032377575989812613, "avg_return": 0.46443966031074524, "regret": 0.35153084993362427, "entropy": 0.12576918303966522, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:25.452968Z", "loop": 2477, "env_steps": 1522483199, "loss": 0.002745852805674076, "avg_return": 0.45074498653411865, "regret": 0.35153084993362427, "entropy": 0.12688329815864563, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:26.613995Z", "loop": 2478, "env_steps": 1523097599, "loss": 0.0024293907918035984, "avg_return": 0.45482301712036133, "regret": 0.35153084993362427, "entropy": 0.11408907920122147, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:27.773432Z", "loop": 2479, "env_steps": 1523711999, "loss": 0.002456525806337595, "avg_return": 0.4505249261856079, "regret": 0.35153084993362427, "entropy": 0.11600838601589203, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:28.979537Z", "loop": 2480, "env_steps": 1524326399, "loss": 0.0022280269768089056, "avg_return": 0.4549817144870758, "regret": 0.35100722312927246, "entropy": 0.11186768114566803, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:30.140888Z", "loop": 2481, "env_steps": 1524940799, "loss": 0.0024231094866991043, "avg_return": 0.4525746703147888, "regret": 0.35100722312927246, "entropy": 0.11524882912635803, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:31.301500Z", "loop": 2482, "env_steps": 1525555199, "loss": 0.002355025615543127, "avg_return": 0.4524654150009155, "regret": 0.35100722312927246, "entropy": 0.10776805132627487, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:32.462899Z", "loop": 2483, "env_steps": 1526169599, "loss": 0.0020587604958564043, "avg_return": 0.45069172978401184, "regret": 0.35100722312927246, "entropy": 0.10697942227125168, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:33.623216Z", "loop": 2484, "env_steps": 1526783999, "loss": 0.0020900333765894175, "avg_return": 0.4521331489086151, "regret": 0.35100722312927246, "entropy": 0.10675844550132751, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:34.784763Z", "loop": 2485, "env_steps": 1527398399, "loss": 0.0020552591886371374, "avg_return": 0.4535573422908783, "regret": 0.35100722312927246, "entropy": 0.10736339539289474, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:35.944878Z", "loop": 2486, "env_steps": 1528012799, "loss": 0.0025227004662156105, "avg_return": 0.45458686351776123, "regret": 0.35100722312927246, "entropy": 0.10296334326267242, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:37.106038Z", "loop": 2487, "env_steps": 1528627199, "loss": 0.00264995195902884, "avg_return": 0.4547131359577179, "regret": 0.35100722312927246, "entropy": 0.11226703971624374, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:38.266039Z", "loop": 2488, "env_steps": 1529241599, "loss": 0.0028995962347835302, "avg_return": 0.4484825134277344, "regret": 0.35100722312927246, "entropy": 0.1145530417561531, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:39.426222Z", "loop": 2489, "env_steps": 1529855999, "loss": 0.0026274577248841524, "avg_return": 0.4490906894207001, "regret": 0.35100722312927246, "entropy": 0.1027250811457634, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:40.634707Z", "loop": 2490, "env_steps": 1530470399, "loss": 0.002452970016747713, "avg_return": 0.4512692987918854, "regret": 0.3512066900730133, "entropy": 0.10781722515821457, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:41.795139Z", "loop": 2491, "env_steps": 1531084799, "loss": 0.002753492211923003, "avg_return": 0.4583023190498352, "regret": 0.3512066900730133, "entropy": 0.10771922767162323, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:42.955247Z", "loop": 2492, "env_steps": 1531699199, "loss": 0.0028254264034330845, "avg_return": 0.4523211717605591, "regret": 0.3512066900730133, "entropy": 0.10359751433134079, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:44.115855Z", "loop": 2493, "env_steps": 1532313599, "loss": 0.0027133163530379534, "avg_return": 0.4481566548347473, "regret": 0.3512066900730133, "entropy": 0.10208660364151001, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:45.277340Z", "loop": 2494, "env_steps": 1532927999, "loss": 0.0027759470976889133, "avg_return": 0.4579564034938812, "regret": 0.3512066900730133, "entropy": 0.09983905404806137, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:46.437427Z", "loop": 2495, "env_steps": 1533542399, "loss": 0.002535149920731783, "avg_return": 0.45007914304733276, "regret": 0.3512066900730133, "entropy": 0.09128778427839279, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:47.598632Z", "loop": 2496, "env_steps": 1534156799, "loss": 0.002426085527986288, "avg_return": 0.455501526594162, "regret": 0.3512066900730133, "entropy": 0.09008114039897919, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:48.758699Z", "loop": 2497, "env_steps": 1534771199, "loss": 0.002298267325386405, "avg_return": 0.45157909393310547, "regret": 0.3512066900730133, "entropy": 0.08694303780794144, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:49.919527Z", "loop": 2498, "env_steps": 1535385599, "loss": 0.0021974395494908094, "avg_return": 0.44960036873817444, "regret": 0.3512066900730133, "entropy": 0.08450977504253387, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:51.080881Z", "loop": 2499, "env_steps": 1535999999, "loss": 0.002229467500001192, "avg_return": 0.45429667830467224, "regret": 0.3512066900730133, "entropy": 0.08276820927858353, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:52.286362Z", "loop": 2500, "env_steps": 1536614399, "loss": 0.002398674376308918, "avg_return": 0.444524347782135, "regret": 0.35196778178215027, "entropy": 0.08382066339254379, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:53.447203Z", "loop": 2501, "env_steps": 1537228799, "loss": 0.0022971294820308685, "avg_return": 0.4426232874393463, "regret": 0.35196778178215027, "entropy": 0.08335557579994202, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:54.608515Z", "loop": 2502, "env_steps": 1537843199, "loss": 0.0022857743315398693, "avg_return": 0.4535622298717499, "regret": 0.35196778178215027, "entropy": 0.07918423414230347, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:55.769107Z", "loop": 2503, "env_steps": 1538457599, "loss": 0.0021034979727119207, "avg_return": 0.45313772559165955, "regret": 0.35196778178215027, "entropy": 0.07901669293642044, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:56.930286Z", "loop": 2504, "env_steps": 1539071999, "loss": 0.002076872158795595, "avg_return": 0.45381632447242737, "regret": 0.35196778178215027, "entropy": 0.07782041281461716, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:58.092063Z", "loop": 2505, "env_steps": 1539686399, "loss": 0.0024231683928519487, "avg_return": 0.45622721314430237, "regret": 0.35196778178215027, "entropy": 0.08287746459245682, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:14:59.252611Z", "loop": 2506, "env_steps": 1540300799, "loss": 0.002124835504218936, "avg_return": 0.45081156492233276, "regret": 0.35196778178215027, "entropy": 0.0858849436044693, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:00.413376Z", "loop": 2507, "env_steps": 1540915199, "loss": 0.0022481128107756376, "avg_return": 0.4640144407749176, "regret": 0.35196778178215027, "entropy": 0.09070384502410889, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:01.574849Z", "loop": 2508, "env_steps": 1541529599, "loss": 0.002069538924843073, "avg_return": 0.4560582637786865, "regret": 0.35196778178215027, "entropy": 0.09658380597829819, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:02.735229Z", "loop": 2509, "env_steps": 1542143999, "loss": 0.0019400559831410646, "avg_return": 0.44959884881973267, "regret": 0.35196778178215027, "entropy": 0.0965404137969017, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:03.942384Z", "loop": 2510, "env_steps": 1542758399, "loss": 0.0021397676318883896, "avg_return": 0.44866374135017395, "regret": 0.351087749004364, "entropy": 0.09741031378507614, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:05.107134Z", "loop": 2511, "env_steps": 1543372799, "loss": 0.001825244165956974, "avg_return": 0.4554850459098816, "regret": 0.351087749004364, "entropy": 0.09255333244800568, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:06.269074Z", "loop": 2512, "env_steps": 1543987199, "loss": 0.0015972655965015292, "avg_return": 0.45165279507637024, "regret": 0.351087749004364, "entropy": 0.09461290389299393, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:07.430657Z", "loop": 2513, "env_steps": 1544601599, "loss": 0.001541637466289103, "avg_return": 0.44897589087486267, "regret": 0.351087749004364, "entropy": 0.09081131964921951, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:08.593455Z", "loop": 2514, "env_steps": 1545215999, "loss": 0.0012098116567358375, "avg_return": 0.4409075379371643, "regret": 0.351087749004364, "entropy": 0.09097463637590408, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:09.753735Z", "loop": 2515, "env_steps": 1545830399, "loss": 0.0016686946619302034, "avg_return": 0.4494006335735321, "regret": 0.351087749004364, "entropy": 0.09411591291427612, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:10.919133Z", "loop": 2516, "env_steps": 1546444799, "loss": 0.002061260398477316, "avg_return": 0.44893860816955566, "regret": 0.351087749004364, "entropy": 0.10169339179992676, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:12.082641Z", "loop": 2517, "env_steps": 1547059199, "loss": 0.0028860261663794518, "avg_return": 0.4547107517719269, "regret": 0.351087749004364, "entropy": 0.10741981863975525, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:13.244672Z", "loop": 2518, "env_steps": 1547673599, "loss": 0.0028881540056318045, "avg_return": 0.44256699085235596, "regret": 0.351087749004364, "entropy": 0.11244254559278488, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:14.407136Z", "loop": 2519, "env_steps": 1548287999, "loss": 0.0028837923891842365, "avg_return": 0.45208340883255005, "regret": 0.351087749004364, "entropy": 0.10974688082933426, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:15.619352Z", "loop": 2520, "env_steps": 1548902399, "loss": 0.002782293362542987, "avg_return": 0.45237040519714355, "regret": 0.35475417971611023, "entropy": 0.11681642383337021, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:16.780616Z", "loop": 2521, "env_steps": 1549516799, "loss": 0.0026502159889787436, "avg_return": 0.4463648498058319, "regret": 0.35475417971611023, "entropy": 0.11438269168138504, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:17.940500Z", "loop": 2522, "env_steps": 1550131199, "loss": 0.002928920788690448, "avg_return": 0.4549001157283783, "regret": 0.35475417971611023, "entropy": 0.10435063391923904, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:19.100119Z", "loop": 2523, "env_steps": 1550745599, "loss": 0.0024298815988004208, "avg_return": 0.44323068857192993, "regret": 0.35475417971611023, "entropy": 0.10698755830526352, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:20.259977Z", "loop": 2524, "env_steps": 1551359999, "loss": 0.0031462765764445066, "avg_return": 0.45996221899986267, "regret": 0.35475417971611023, "entropy": 0.11053890734910965, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:21.419394Z", "loop": 2525, "env_steps": 1551974399, "loss": 0.0027166667860001326, "avg_return": 0.45473113656044006, "regret": 0.35475417971611023, "entropy": 0.11059565842151642, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:22.580191Z", "loop": 2526, "env_steps": 1552588799, "loss": 0.0025740088894963264, "avg_return": 0.45548829436302185, "regret": 0.35475417971611023, "entropy": 0.10722259432077408, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:23.740784Z", "loop": 2527, "env_steps": 1553203199, "loss": 0.001991826808080077, "avg_return": 0.4566497802734375, "regret": 0.35475417971611023, "entropy": 0.09671545028686523, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:24.901996Z", "loop": 2528, "env_steps": 1553817599, "loss": 0.0013211136683821678, "avg_return": 0.4510209262371063, "regret": 0.35475417971611023, "entropy": 0.08610659092664719, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:26.061892Z", "loop": 2529, "env_steps": 1554431999, "loss": 0.0010801872704178095, "avg_return": 0.4539658725261688, "regret": 0.35475417971611023, "entropy": 0.08462008088827133, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:27.268329Z", "loop": 2530, "env_steps": 1555046399, "loss": 0.0010627243900671601, "avg_return": 0.4508809447288513, "regret": 0.35132285952568054, "entropy": 0.08061658591032028, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:28.428886Z", "loop": 2531, "env_steps": 1555660799, "loss": 0.0013377465074881911, "avg_return": 0.4492529332637787, "regret": 0.35132285952568054, "entropy": 0.0881938636302948, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:29.591098Z", "loop": 2532, "env_steps": 1556275199, "loss": 0.0013473808066919446, "avg_return": 0.45331010222435, "regret": 0.35132285952568054, "entropy": 0.08048082143068314, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:30.751536Z", "loop": 2533, "env_steps": 1556889599, "loss": 0.0016959531931206584, "avg_return": 0.45223796367645264, "regret": 0.35132285952568054, "entropy": 0.08908125758171082, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:31.912413Z", "loop": 2534, "env_steps": 1557503999, "loss": 0.0017030269373208284, "avg_return": 0.44864529371261597, "regret": 0.35132285952568054, "entropy": 0.09118594229221344, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:33.074371Z", "loop": 2535, "env_steps": 1558118399, "loss": 0.0020212118979543447, "avg_return": 0.4529169797897339, "regret": 0.35132285952568054, "entropy": 0.09368876367807388, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:34.235205Z", "loop": 2536, "env_steps": 1558732799, "loss": 0.001990524586290121, "avg_return": 0.45461609959602356, "regret": 0.35132285952568054, "entropy": 0.09334608912467957, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:35.398247Z", "loop": 2537, "env_steps": 1559347199, "loss": 0.002373253460973501, "avg_return": 0.46071794629096985, "regret": 0.35132285952568054, "entropy": 0.09918982535600662, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:36.558984Z", "loop": 2538, "env_steps": 1559961599, "loss": 0.0020592091605067253, "avg_return": 0.44472500681877136, "regret": 0.35132285952568054, "entropy": 0.09596245735883713, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:37.719988Z", "loop": 2539, "env_steps": 1560575999, "loss": 0.00191673100925982, "avg_return": 0.453235387802124, "regret": 0.35132285952568054, "entropy": 0.09046211838722229, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:38.931085Z", "loop": 2540, "env_steps": 1561190399, "loss": 0.0022997192572802305, "avg_return": 0.4552094638347626, "regret": 0.35099491477012634, "entropy": 0.08982137590646744, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:40.095218Z", "loop": 2541, "env_steps": 1561804799, "loss": 0.0026040475349873304, "avg_return": 0.4594578146934509, "regret": 0.35099491477012634, "entropy": 0.08910961449146271, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:41.256473Z", "loop": 2542, "env_steps": 1562419199, "loss": 0.002901251194998622, "avg_return": 0.45567765831947327, "regret": 0.35099491477012634, "entropy": 0.08730319887399673, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:42.416374Z", "loop": 2543, "env_steps": 1563033599, "loss": 0.0025891067925840616, "avg_return": 0.45245757699012756, "regret": 0.35099491477012634, "entropy": 0.08786716312170029, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:43.577003Z", "loop": 2544, "env_steps": 1563647999, "loss": 0.00275578536093235, "avg_return": 0.4518195688724518, "regret": 0.35099491477012634, "entropy": 0.0877571851015091, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:44.738238Z", "loop": 2545, "env_steps": 1564262399, "loss": 0.0027979512233287096, "avg_return": 0.4565465450286865, "regret": 0.35099491477012634, "entropy": 0.08829130232334137, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:45.899927Z", "loop": 2546, "env_steps": 1564876799, "loss": 0.002674631541594863, "avg_return": 0.4625219702720642, "regret": 0.35099491477012634, "entropy": 0.08967647701501846, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:47.061200Z", "loop": 2547, "env_steps": 1565491199, "loss": 0.0025952267460525036, "avg_return": 0.45083680748939514, "regret": 0.35099491477012634, "entropy": 0.08872164785861969, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:48.221694Z", "loop": 2548, "env_steps": 1566105599, "loss": 0.0027270163409411907, "avg_return": 0.4424785375595093, "regret": 0.35099491477012634, "entropy": 0.09202946722507477, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:49.383385Z", "loop": 2549, "env_steps": 1566719999, "loss": 0.0029100081883370876, "avg_return": 0.45582008361816406, "regret": 0.35099491477012634, "entropy": 0.0954425036907196, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:50.598917Z", "loop": 2550, "env_steps": 1567334399, "loss": 0.002696617506444454, "avg_return": 0.4450063109397888, "regret": 0.35126325488090515, "entropy": 0.08663403987884521, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:51.760024Z", "loop": 2551, "env_steps": 1567948799, "loss": 0.0029700985178351402, "avg_return": 0.45376551151275635, "regret": 0.35126325488090515, "entropy": 0.08806701749563217, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:52.920904Z", "loop": 2552, "env_steps": 1568563199, "loss": 0.003257863922044635, "avg_return": 0.45852550864219666, "regret": 0.35126325488090515, "entropy": 0.08750718086957932, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:54.081781Z", "loop": 2553, "env_steps": 1569177599, "loss": 0.00319278915412724, "avg_return": 0.4438606798648834, "regret": 0.35126325488090515, "entropy": 0.08800516277551651, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:55.242153Z", "loop": 2554, "env_steps": 1569791999, "loss": 0.003339995862916112, "avg_return": 0.45075756311416626, "regret": 0.35126325488090515, "entropy": 0.08956649154424667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:56.402902Z", "loop": 2555, "env_steps": 1570406399, "loss": 0.003557418007403612, "avg_return": 0.4486999213695526, "regret": 0.35126325488090515, "entropy": 0.09516850113868713, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:57.564220Z", "loop": 2556, "env_steps": 1571020799, "loss": 0.003991798032075167, "avg_return": 0.4356019198894501, "regret": 0.35126325488090515, "entropy": 0.1019783690571785, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:58.724068Z", "loop": 2557, "env_steps": 1571635199, "loss": 0.004303854424506426, "avg_return": 0.4466386139392853, "regret": 0.35126325488090515, "entropy": 0.10482734441757202, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:15:59.885054Z", "loop": 2558, "env_steps": 1572249599, "loss": 0.004098296165466309, "avg_return": 0.4415871202945709, "regret": 0.35126325488090515, "entropy": 0.10391012579202652, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:01.044965Z", "loop": 2559, "env_steps": 1572863999, "loss": 0.0030174979474395514, "avg_return": 0.4407966136932373, "regret": 0.35126325488090515, "entropy": 0.09447155147790909, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:02.252716Z", "loop": 2560, "env_steps": 1573478399, "loss": 0.0033547698985785246, "avg_return": 0.448648601770401, "regret": 0.3531491458415985, "entropy": 0.0937664583325386, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:03.413435Z", "loop": 2561, "env_steps": 1574092799, "loss": 0.0030732040759176016, "avg_return": 0.45280152559280396, "regret": 0.3531491458415985, "entropy": 0.09842797368764877, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:04.574659Z", "loop": 2562, "env_steps": 1574707199, "loss": 0.0030611276160925627, "avg_return": 0.45401379466056824, "regret": 0.3531491458415985, "entropy": 0.09544885158538818, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:05.734716Z", "loop": 2563, "env_steps": 1575321599, "loss": 0.0026536108925938606, "avg_return": 0.4585113525390625, "regret": 0.3531491458415985, "entropy": 0.09786800295114517, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:06.895431Z", "loop": 2564, "env_steps": 1575935999, "loss": 0.0023805703967809677, "avg_return": 0.45643219351768494, "regret": 0.3531491458415985, "entropy": 0.0946454256772995, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:08.056662Z", "loop": 2565, "env_steps": 1576550399, "loss": 0.002018444472923875, "avg_return": 0.45549800992012024, "regret": 0.3531491458415985, "entropy": 0.09326165914535522, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:09.217110Z", "loop": 2566, "env_steps": 1577164799, "loss": 0.0018236072501167655, "avg_return": 0.45127764344215393, "regret": 0.3531491458415985, "entropy": 0.09148818254470825, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:10.378415Z", "loop": 2567, "env_steps": 1577779199, "loss": 0.0017859697109088302, "avg_return": 0.45470306277275085, "regret": 0.3531491458415985, "entropy": 0.08473919332027435, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:11.539897Z", "loop": 2568, "env_steps": 1578393599, "loss": 0.0016637903172522783, "avg_return": 0.45313334465026855, "regret": 0.3531491458415985, "entropy": 0.0888451635837555, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:12.700266Z", "loop": 2569, "env_steps": 1579007999, "loss": 0.0014843781245872378, "avg_return": 0.45190197229385376, "regret": 0.3531491458415985, "entropy": 0.09610310941934586, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:13.908079Z", "loop": 2570, "env_steps": 1579622399, "loss": 0.001482869265601039, "avg_return": 0.45231643319129944, "regret": 0.3510552942752838, "entropy": 0.08988979458808899, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:15.068311Z", "loop": 2571, "env_steps": 1580236799, "loss": 0.001655783737078309, "avg_return": 0.45581117272377014, "regret": 0.3510552942752838, "entropy": 0.08914614468812943, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:16.228622Z", "loop": 2572, "env_steps": 1580851199, "loss": 0.0015231481520459056, "avg_return": 0.45141053199768066, "regret": 0.3510552942752838, "entropy": 0.09127892553806305, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:17.390207Z", "loop": 2573, "env_steps": 1581465599, "loss": 0.0016168771544471383, "avg_return": 0.450700581073761, "regret": 0.3510552942752838, "entropy": 0.08801726251840591, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:18.551823Z", "loop": 2574, "env_steps": 1582079999, "loss": 0.0017051041359081864, "avg_return": 0.4510103464126587, "regret": 0.3510552942752838, "entropy": 0.09228217601776123, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:19.712581Z", "loop": 2575, "env_steps": 1582694399, "loss": 0.0017804577946662903, "avg_return": 0.4508495330810547, "regret": 0.3510552942752838, "entropy": 0.09995455294847488, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:20.873532Z", "loop": 2576, "env_steps": 1583308799, "loss": 0.0019645821303129196, "avg_return": 0.4498564898967743, "regret": 0.3510552942752838, "entropy": 0.09550604969263077, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:22.036519Z", "loop": 2577, "env_steps": 1583923199, "loss": 0.001830988796427846, "avg_return": 0.45249563455581665, "regret": 0.3510552942752838, "entropy": 0.09170309454202652, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:23.196682Z", "loop": 2578, "env_steps": 1584537599, "loss": 0.0016429646639153361, "avg_return": 0.44960227608680725, "regret": 0.3510552942752838, "entropy": 0.09585487842559814, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:24.355856Z", "loop": 2579, "env_steps": 1585151999, "loss": 0.0018214574083685875, "avg_return": 0.4462059736251831, "regret": 0.3510552942752838, "entropy": 0.0952734425663948, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:25.564620Z", "loop": 2580, "env_steps": 1585766399, "loss": 0.0018946565687656403, "avg_return": 0.4532609283924103, "regret": 0.3520289957523346, "entropy": 0.09570255875587463, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:26.728262Z", "loop": 2581, "env_steps": 1586380799, "loss": 0.0017415372421965003, "avg_return": 0.456716924905777, "regret": 0.3520289957523346, "entropy": 0.09418164938688278, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:27.890335Z", "loop": 2582, "env_steps": 1586995199, "loss": 0.001799362595193088, "avg_return": 0.4531756639480591, "regret": 0.3520289957523346, "entropy": 0.09643463790416718, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:29.052144Z", "loop": 2583, "env_steps": 1587609599, "loss": 0.0018157459562644362, "avg_return": 0.4493557810783386, "regret": 0.3520289957523346, "entropy": 0.09267502278089523, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:30.212891Z", "loop": 2584, "env_steps": 1588223999, "loss": 0.0017115733353421092, "avg_return": 0.447770357131958, "regret": 0.3520289957523346, "entropy": 0.09660858660936356, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:31.375285Z", "loop": 2585, "env_steps": 1588838399, "loss": 0.0014368453994393349, "avg_return": 0.45337286591529846, "regret": 0.3520289957523346, "entropy": 0.08656192570924759, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:32.537158Z", "loop": 2586, "env_steps": 1589452799, "loss": 0.0018999067833647132, "avg_return": 0.45256364345550537, "regret": 0.3520289957523346, "entropy": 0.09466727823019028, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:33.698404Z", "loop": 2587, "env_steps": 1590067199, "loss": 0.001955726882442832, "avg_return": 0.4523104429244995, "regret": 0.3520289957523346, "entropy": 0.09237312525510788, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:34.859479Z", "loop": 2588, "env_steps": 1590681599, "loss": 0.0018163276836276054, "avg_return": 0.45019227266311646, "regret": 0.3520289957523346, "entropy": 0.09597410261631012, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:36.019825Z", "loop": 2589, "env_steps": 1591295999, "loss": 0.0018064490286633372, "avg_return": 0.45855119824409485, "regret": 0.3520289957523346, "entropy": 0.08587798476219177, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:37.230306Z", "loop": 2590, "env_steps": 1591910399, "loss": 0.0015829941257834435, "avg_return": 0.4469395577907562, "regret": 0.3512057960033417, "entropy": 0.09140224754810333, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:38.391707Z", "loop": 2591, "env_steps": 1592524799, "loss": 0.0017985351150855422, "avg_return": 0.45882782340049744, "regret": 0.3512057960033417, "entropy": 0.09159067273139954, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:39.553487Z", "loop": 2592, "env_steps": 1593139199, "loss": 0.0014368308475241065, "avg_return": 0.45502471923828125, "regret": 0.3512057960033417, "entropy": 0.09280704706907272, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:40.713365Z", "loop": 2593, "env_steps": 1593753599, "loss": 0.0017240071902051568, "avg_return": 0.4494578242301941, "regret": 0.3512057960033417, "entropy": 0.0936538577079773, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:41.875209Z", "loop": 2594, "env_steps": 1594367999, "loss": 0.0014768667751923203, "avg_return": 0.4538375437259674, "regret": 0.3512057960033417, "entropy": 0.09053342044353485, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:43.036218Z", "loop": 2595, "env_steps": 1594982399, "loss": 0.0017792930593714118, "avg_return": 0.4591258764266968, "regret": 0.3512057960033417, "entropy": 0.09310077875852585, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:44.196699Z", "loop": 2596, "env_steps": 1595596799, "loss": 0.001988242147490382, "avg_return": 0.4514218270778656, "regret": 0.3512057960033417, "entropy": 0.09419114142656326, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:45.356554Z", "loop": 2597, "env_steps": 1596211199, "loss": 0.0017010311130434275, "avg_return": 0.45600587129592896, "regret": 0.3512057960033417, "entropy": 0.09644198417663574, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:46.516923Z", "loop": 2598, "env_steps": 1596825599, "loss": 0.0016701510176062584, "avg_return": 0.459660142660141, "regret": 0.3512057960033417, "entropy": 0.09361860156059265, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:47.678476Z", "loop": 2599, "env_steps": 1597439999, "loss": 0.00183075200766325, "avg_return": 0.44869405031204224, "regret": 0.3512057960033417, "entropy": 0.09179069846868515, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:48.885673Z", "loop": 2600, "env_steps": 1598054399, "loss": 0.0018176184967160225, "avg_return": 0.4486098885536194, "regret": 0.3509843945503235, "entropy": 0.09303352981805801, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:50.050224Z", "loop": 2601, "env_steps": 1598668799, "loss": 0.0019469145918264985, "avg_return": 0.45825329422950745, "regret": 0.3509843945503235, "entropy": 0.0898609310388565, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:51.210784Z", "loop": 2602, "env_steps": 1599283199, "loss": 0.0019464934011921287, "avg_return": 0.4495942294597626, "regret": 0.3509843945503235, "entropy": 0.09723040461540222, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:52.372523Z", "loop": 2603, "env_steps": 1599897599, "loss": 0.002176334848627448, "avg_return": 0.45158055424690247, "regret": 0.3509843945503235, "entropy": 0.09470558911561966, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:53.536804Z", "loop": 2604, "env_steps": 1600511999, "loss": 0.0020315246656537056, "avg_return": 0.4635595679283142, "regret": 0.3509843945503235, "entropy": 0.10026277601718903, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:54.699258Z", "loop": 2605, "env_steps": 1601126399, "loss": 0.0020670376252382994, "avg_return": 0.4518931806087494, "regret": 0.3509843945503235, "entropy": 0.08919492363929749, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:55.861441Z", "loop": 2606, "env_steps": 1601740799, "loss": 0.0021432209759950638, "avg_return": 0.45407360792160034, "regret": 0.3509843945503235, "entropy": 0.09261464327573776, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:57.021278Z", "loop": 2607, "env_steps": 1602355199, "loss": 0.0025014046113938093, "avg_return": 0.45036444067955017, "regret": 0.3509843945503235, "entropy": 0.09612659364938736, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:58.183681Z", "loop": 2608, "env_steps": 1602969599, "loss": 0.002610659459605813, "avg_return": 0.4529722332954407, "regret": 0.3509843945503235, "entropy": 0.10098449140787125, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:16:59.345430Z", "loop": 2609, "env_steps": 1603583999, "loss": 0.002978472737595439, "avg_return": 0.45586782693862915, "regret": 0.3509843945503235, "entropy": 0.09512294828891754, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:00.560258Z", "loop": 2610, "env_steps": 1604198399, "loss": 0.0025088682305067778, "avg_return": 0.45305493474006653, "regret": 0.35125041007995605, "entropy": 0.09629715234041214, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:01.722040Z", "loop": 2611, "env_steps": 1604812799, "loss": 0.00232694111764431, "avg_return": 0.45573508739471436, "regret": 0.35125041007995605, "entropy": 0.09120684117078781, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:02.883017Z", "loop": 2612, "env_steps": 1605427199, "loss": 0.0020415231119841337, "avg_return": 0.4585631489753723, "regret": 0.35125041007995605, "entropy": 0.08811083436012268, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:04.044561Z", "loop": 2613, "env_steps": 1606041599, "loss": 0.0018018133705481887, "avg_return": 0.45321401953697205, "regret": 0.35125041007995605, "entropy": 0.0890364721417427, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:05.204542Z", "loop": 2614, "env_steps": 1606655999, "loss": 0.0018262576777487993, "avg_return": 0.4533182382583618, "regret": 0.35125041007995605, "entropy": 0.08997992426156998, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:06.365771Z", "loop": 2615, "env_steps": 1607270399, "loss": 0.0018116930732503533, "avg_return": 0.45500311255455017, "regret": 0.35125041007995605, "entropy": 0.08482061326503754, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:07.525688Z", "loop": 2616, "env_steps": 1607884799, "loss": 0.0016327587654814124, "avg_return": 0.4615306258201599, "regret": 0.35125041007995605, "entropy": 0.08549270033836365, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:08.690457Z", "loop": 2617, "env_steps": 1608499199, "loss": 0.001712729106657207, "avg_return": 0.4522480368614197, "regret": 0.35125041007995605, "entropy": 0.0886007621884346, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:09.851903Z", "loop": 2618, "env_steps": 1609113599, "loss": 0.0018315258203074336, "avg_return": 0.45000579953193665, "regret": 0.35125041007995605, "entropy": 0.09147215634584427, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:11.012549Z", "loop": 2619, "env_steps": 1609727999, "loss": 0.0018636872991919518, "avg_return": 0.4501246213912964, "regret": 0.35125041007995605, "entropy": 0.09915938973426819, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:12.221615Z", "loop": 2620, "env_steps": 1610342399, "loss": 0.001803682534955442, "avg_return": 0.45341721177101135, "regret": 0.3512636125087738, "entropy": 0.09254387766122818, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:13.382891Z", "loop": 2621, "env_steps": 1610956799, "loss": 0.0014744221698492765, "avg_return": 0.45771342515945435, "regret": 0.3512636125087738, "entropy": 0.09422655403614044, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:14.543954Z", "loop": 2622, "env_steps": 1611571199, "loss": 0.0015951868845149875, "avg_return": 0.4539969861507416, "regret": 0.3512636125087738, "entropy": 0.08609970659017563, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:15.702991Z", "loop": 2623, "env_steps": 1612185599, "loss": 0.001490080263465643, "avg_return": 0.4504203498363495, "regret": 0.3512636125087738, "entropy": 0.08912328630685806, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:16.863904Z", "loop": 2624, "env_steps": 1612799999, "loss": 0.001531817833893001, "avg_return": 0.45302075147628784, "regret": 0.3512636125087738, "entropy": 0.08779233694076538, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:18.023573Z", "loop": 2625, "env_steps": 1613414399, "loss": 0.0017501472029834986, "avg_return": 0.449096143245697, "regret": 0.3512636125087738, "entropy": 0.0865006223320961, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:19.184142Z", "loop": 2626, "env_steps": 1614028799, "loss": 0.0017691761022433639, "avg_return": 0.4504263401031494, "regret": 0.3512636125087738, "entropy": 0.07887795567512512, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:20.344355Z", "loop": 2627, "env_steps": 1614643199, "loss": 0.0016629438614472747, "avg_return": 0.4545213282108307, "regret": 0.3512636125087738, "entropy": 0.08095932006835938, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:21.504398Z", "loop": 2628, "env_steps": 1615257599, "loss": 0.0015672225272282958, "avg_return": 0.45389324426651, "regret": 0.3512636125087738, "entropy": 0.0792049914598465, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:22.665498Z", "loop": 2629, "env_steps": 1615871999, "loss": 0.0016289519844576716, "avg_return": 0.45314687490463257, "regret": 0.3512636125087738, "entropy": 0.08297913521528244, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:23.870711Z", "loop": 2630, "env_steps": 1616486399, "loss": 0.0016421031905338168, "avg_return": 0.44951131939888, "regret": 0.35159680247306824, "entropy": 0.08093270659446716, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:25.034679Z", "loop": 2631, "env_steps": 1617100799, "loss": 0.0016712757060304284, "avg_return": 0.4521563947200775, "regret": 0.35159680247306824, "entropy": 0.08216206729412079, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:26.195278Z", "loop": 2632, "env_steps": 1617715199, "loss": 0.0014079184038564563, "avg_return": 0.4483376145362854, "regret": 0.35159680247306824, "entropy": 0.08241154998540878, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:27.355977Z", "loop": 2633, "env_steps": 1618329599, "loss": 0.0014202006859704852, "avg_return": 0.45608124136924744, "regret": 0.35159680247306824, "entropy": 0.07512159645557404, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:28.516761Z", "loop": 2634, "env_steps": 1618943999, "loss": 0.0012482417514547706, "avg_return": 0.45277151465415955, "regret": 0.35159680247306824, "entropy": 0.08846322447061539, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:29.678105Z", "loop": 2635, "env_steps": 1619558399, "loss": 0.0014364438829943538, "avg_return": 0.4515746533870697, "regret": 0.35159680247306824, "entropy": 0.09042321145534515, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:30.838667Z", "loop": 2636, "env_steps": 1620172799, "loss": 0.0011638518190011382, "avg_return": 0.45026907324790955, "regret": 0.35159680247306824, "entropy": 0.08158504962921143, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:31.997333Z", "loop": 2637, "env_steps": 1620787199, "loss": 0.0015514726983383298, "avg_return": 0.44988465309143066, "regret": 0.35159680247306824, "entropy": 0.08767920732498169, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:33.157884Z", "loop": 2638, "env_steps": 1621401599, "loss": 0.0014525956939905882, "avg_return": 0.4509192407131195, "regret": 0.35159680247306824, "entropy": 0.08257273584604263, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:34.317739Z", "loop": 2639, "env_steps": 1622015999, "loss": 0.001418513711541891, "avg_return": 0.44571229815483093, "regret": 0.35159680247306824, "entropy": 0.08609192073345184, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:35.525160Z", "loop": 2640, "env_steps": 1622630399, "loss": 0.0013065529055893421, "avg_return": 0.4465719759464264, "regret": 0.3517736494541168, "entropy": 0.078666552901268, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:36.687845Z", "loop": 2641, "env_steps": 1623244799, "loss": 0.001302453689277172, "avg_return": 0.4522896409034729, "regret": 0.3517736494541168, "entropy": 0.08487046509981155, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:37.849899Z", "loop": 2642, "env_steps": 1623859199, "loss": 0.001355574349872768, "avg_return": 0.4578475058078766, "regret": 0.3517736494541168, "entropy": 0.07714632153511047, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:39.010853Z", "loop": 2643, "env_steps": 1624473599, "loss": 0.0013860630569979548, "avg_return": 0.4484283924102783, "regret": 0.3517736494541168, "entropy": 0.08427077531814575, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:40.174468Z", "loop": 2644, "env_steps": 1625087999, "loss": 0.001510248752310872, "avg_return": 0.446514755487442, "regret": 0.3517736494541168, "entropy": 0.08305522799491882, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:41.337021Z", "loop": 2645, "env_steps": 1625702399, "loss": 0.0016987965209409595, "avg_return": 0.4508551061153412, "regret": 0.3517736494541168, "entropy": 0.08451320976018906, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:42.497287Z", "loop": 2646, "env_steps": 1626316799, "loss": 0.002182444790378213, "avg_return": 0.45309123396873474, "regret": 0.3517736494541168, "entropy": 0.07825542986392975, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:43.659715Z", "loop": 2647, "env_steps": 1626931199, "loss": 0.002178232418373227, "avg_return": 0.45502781867980957, "regret": 0.3517736494541168, "entropy": 0.0797167494893074, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:44.820992Z", "loop": 2648, "env_steps": 1627545599, "loss": 0.0024017514660954475, "avg_return": 0.46028077602386475, "regret": 0.3517736494541168, "entropy": 0.07815922051668167, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:45.983621Z", "loop": 2649, "env_steps": 1628159999, "loss": 0.002760132774710655, "avg_return": 0.45243266224861145, "regret": 0.3517736494541168, "entropy": 0.0790528655052185, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:47.197398Z", "loop": 2650, "env_steps": 1628774399, "loss": 0.002709783846512437, "avg_return": 0.45285916328430176, "regret": 0.3515811264514923, "entropy": 0.07878126204013824, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:48.358171Z", "loop": 2651, "env_steps": 1629388799, "loss": 0.003118286607787013, "avg_return": 0.4502483308315277, "regret": 0.3515811264514923, "entropy": 0.08090159296989441, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:49.518557Z", "loop": 2652, "env_steps": 1630003199, "loss": 0.003198121441528201, "avg_return": 0.4489758312702179, "regret": 0.3515811264514923, "entropy": 0.08491149544715881, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:50.679846Z", "loop": 2653, "env_steps": 1630617599, "loss": 0.003245748346671462, "avg_return": 0.44921785593032837, "regret": 0.3515811264514923, "entropy": 0.08421387523412704, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:51.842008Z", "loop": 2654, "env_steps": 1631231999, "loss": 0.0033748627174645662, "avg_return": 0.4523710310459137, "regret": 0.3515811264514923, "entropy": 0.08435136824846268, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:53.002662Z", "loop": 2655, "env_steps": 1631846399, "loss": 0.0033561517484486103, "avg_return": 0.4516816735267639, "regret": 0.3515811264514923, "entropy": 0.08182618021965027, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:54.163959Z", "loop": 2656, "env_steps": 1632460799, "loss": 0.0033636149019002914, "avg_return": 0.45307648181915283, "regret": 0.3515811264514923, "entropy": 0.08338945358991623, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:55.324512Z", "loop": 2657, "env_steps": 1633075199, "loss": 0.0024606864899396896, "avg_return": 0.45146435499191284, "regret": 0.3515811264514923, "entropy": 0.07700584828853607, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:56.486391Z", "loop": 2658, "env_steps": 1633689599, "loss": 0.0021342465188354254, "avg_return": 0.44999513030052185, "regret": 0.3515811264514923, "entropy": 0.07171542197465897, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:57.649459Z", "loop": 2659, "env_steps": 1634303999, "loss": 0.002016292652115226, "avg_return": 0.4483696520328522, "regret": 0.3515811264514923, "entropy": 0.07197647541761398, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:17:58.855309Z", "loop": 2660, "env_steps": 1634918399, "loss": 0.002173475455492735, "avg_return": 0.45565637946128845, "regret": 0.3510489761829376, "entropy": 0.08125395327806473, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:00.017097Z", "loop": 2661, "env_steps": 1635532799, "loss": 0.0015922423917800188, "avg_return": 0.4466569125652313, "regret": 0.3510489761829376, "entropy": 0.08228391408920288, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:01.176849Z", "loop": 2662, "env_steps": 1636147199, "loss": 0.001305056270211935, "avg_return": 0.4602993428707123, "regret": 0.3510489761829376, "entropy": 0.08480393886566162, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:02.336648Z", "loop": 2663, "env_steps": 1636761599, "loss": 0.0014948589960113168, "avg_return": 0.4452167749404907, "regret": 0.3510489761829376, "entropy": 0.08202376961708069, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:03.495963Z", "loop": 2664, "env_steps": 1637375999, "loss": 0.0018501243321225047, "avg_return": 0.4530273675918579, "regret": 0.3510489761829376, "entropy": 0.09178104251623154, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:04.656587Z", "loop": 2665, "env_steps": 1637990399, "loss": 0.0014596543041989207, "avg_return": 0.45346346497535706, "regret": 0.3510489761829376, "entropy": 0.08561576902866364, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:05.815715Z", "loop": 2666, "env_steps": 1638604799, "loss": 0.0009781451663002372, "avg_return": 0.44738373160362244, "regret": 0.3510489761829376, "entropy": 0.07928845286369324, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:06.976043Z", "loop": 2667, "env_steps": 1639219199, "loss": 0.0008681568433530629, "avg_return": 0.4438445270061493, "regret": 0.3510489761829376, "entropy": 0.07378121465444565, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:08.137787Z", "loop": 2668, "env_steps": 1639833599, "loss": 0.0009571781265549362, "avg_return": 0.4533620774745941, "regret": 0.3510489761829376, "entropy": 0.07367216795682907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:09.298124Z", "loop": 2669, "env_steps": 1640447999, "loss": 0.0010949326679110527, "avg_return": 0.4539402425289154, "regret": 0.3510489761829376, "entropy": 0.07859735935926437, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:10.505314Z", "loop": 2670, "env_steps": 1641062399, "loss": 0.0013832193799316883, "avg_return": 0.45623379945755005, "regret": 0.35391587018966675, "entropy": 0.07987294346094131, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:11.666410Z", "loop": 2671, "env_steps": 1641676799, "loss": 0.0016974961617961526, "avg_return": 0.4491375982761383, "regret": 0.35391587018966675, "entropy": 0.09086894989013672, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:12.831191Z", "loop": 2672, "env_steps": 1642291199, "loss": 0.002001386834308505, "avg_return": 0.44640401005744934, "regret": 0.35391587018966675, "entropy": 0.08916269242763519, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:13.991823Z", "loop": 2673, "env_steps": 1642905599, "loss": 0.0020008385181427, "avg_return": 0.44657185673713684, "regret": 0.35391587018966675, "entropy": 0.08505427837371826, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:15.154120Z", "loop": 2674, "env_steps": 1643519999, "loss": 0.001630230457521975, "avg_return": 0.451670378446579, "regret": 0.35391587018966675, "entropy": 0.08244643360376358, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:16.314898Z", "loop": 2675, "env_steps": 1644134399, "loss": 0.0015193111030384898, "avg_return": 0.450447142124176, "regret": 0.35391587018966675, "entropy": 0.08717693388462067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:17.477276Z", "loop": 2676, "env_steps": 1644748799, "loss": 0.0016406470676884055, "avg_return": 0.44515952467918396, "regret": 0.35391587018966675, "entropy": 0.08447803556919098, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:18.640595Z", "loop": 2677, "env_steps": 1645363199, "loss": 0.001537470263428986, "avg_return": 0.45174190402030945, "regret": 0.35391587018966675, "entropy": 0.0798807442188263, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:19.801547Z", "loop": 2678, "env_steps": 1645977599, "loss": 0.0012684756657108665, "avg_return": 0.4473963975906372, "regret": 0.35391587018966675, "entropy": 0.0854090005159378, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:20.963112Z", "loop": 2679, "env_steps": 1646591999, "loss": 0.0014160833088681102, "avg_return": 0.45074912905693054, "regret": 0.35391587018966675, "entropy": 0.07967919111251831, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:22.179184Z", "loop": 2680, "env_steps": 1647206399, "loss": 0.0015543604968115687, "avg_return": 0.4493621289730072, "regret": 0.3527261018753052, "entropy": 0.07976988703012466, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:23.340782Z", "loop": 2681, "env_steps": 1647820799, "loss": 0.0013332826783880591, "avg_return": 0.45195820927619934, "regret": 0.3527261018753052, "entropy": 0.07896789163351059, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:24.500989Z", "loop": 2682, "env_steps": 1648435199, "loss": 0.0011405382538214326, "avg_return": 0.4513518810272217, "regret": 0.3527261018753052, "entropy": 0.08138999342918396, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:25.661732Z", "loop": 2683, "env_steps": 1649049599, "loss": 0.0010960646905004978, "avg_return": 0.4574037194252014, "regret": 0.3527261018753052, "entropy": 0.07520011067390442, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:26.822672Z", "loop": 2684, "env_steps": 1649663999, "loss": 0.0008458938682451844, "avg_return": 0.45276662707328796, "regret": 0.3527261018753052, "entropy": 0.07855533808469772, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:27.983504Z", "loop": 2685, "env_steps": 1650278399, "loss": 0.0009879866847768426, "avg_return": 0.45881327986717224, "regret": 0.3527261018753052, "entropy": 0.07871820032596588, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:29.145131Z", "loop": 2686, "env_steps": 1650892799, "loss": 0.0010274695232510567, "avg_return": 0.4558500349521637, "regret": 0.3527261018753052, "entropy": 0.07803383469581604, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:30.305516Z", "loop": 2687, "env_steps": 1651507199, "loss": 0.0010816707508638501, "avg_return": 0.4498380720615387, "regret": 0.3527261018753052, "entropy": 0.07778307795524597, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:31.466607Z", "loop": 2688, "env_steps": 1652121599, "loss": 0.0009538499871268868, "avg_return": 0.45120930671691895, "regret": 0.3527261018753052, "entropy": 0.07850272208452225, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:32.628825Z", "loop": 2689, "env_steps": 1652735999, "loss": 0.001033794367685914, "avg_return": 0.45504528284072876, "regret": 0.3527261018753052, "entropy": 0.07496006041765213, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:33.834792Z", "loop": 2690, "env_steps": 1653350399, "loss": 0.001171671668998897, "avg_return": 0.45371389389038086, "regret": 0.35106566548347473, "entropy": 0.07755623012781143, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:34.996156Z", "loop": 2691, "env_steps": 1653964799, "loss": 0.0011153764789924026, "avg_return": 0.450198769569397, "regret": 0.35106566548347473, "entropy": 0.07960686832666397, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:36.157123Z", "loop": 2692, "env_steps": 1654579199, "loss": 0.0010068429401144385, "avg_return": 0.4479699730873108, "regret": 0.35106566548347473, "entropy": 0.08024749159812927, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:37.317406Z", "loop": 2693, "env_steps": 1655193599, "loss": 0.0010625469731166959, "avg_return": 0.45205965638160706, "regret": 0.35106566548347473, "entropy": 0.08207006007432938, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:38.477548Z", "loop": 2694, "env_steps": 1655807999, "loss": 0.0011301939375698566, "avg_return": 0.4584483504295349, "regret": 0.35106566548347473, "entropy": 0.08005259931087494, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:39.638849Z", "loop": 2695, "env_steps": 1656422399, "loss": 0.0011738428147509694, "avg_return": 0.4532035291194916, "regret": 0.35106566548347473, "entropy": 0.08235914260149002, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:40.799206Z", "loop": 2696, "env_steps": 1657036799, "loss": 0.0012196473544463515, "avg_return": 0.4541102647781372, "regret": 0.35106566548347473, "entropy": 0.08294445276260376, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:41.960652Z", "loop": 2697, "env_steps": 1657651199, "loss": 0.0010597832733765244, "avg_return": 0.45277273654937744, "regret": 0.35106566548347473, "entropy": 0.08171061426401138, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:43.120828Z", "loop": 2698, "env_steps": 1658265599, "loss": 0.0010432158596813679, "avg_return": 0.4554918110370636, "regret": 0.35106566548347473, "entropy": 0.08108694851398468, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:44.281638Z", "loop": 2699, "env_steps": 1658879999, "loss": 0.000998915289528668, "avg_return": 0.446546345949173, "regret": 0.35106566548347473, "entropy": 0.08235649764537811, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:45.488134Z", "loop": 2700, "env_steps": 1659494399, "loss": 0.001018290757201612, "avg_return": 0.45563405752182007, "regret": 0.35103169083595276, "entropy": 0.08166883140802383, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:46.651798Z", "loop": 2701, "env_steps": 1660108799, "loss": 0.001030946965329349, "avg_return": 0.4519459009170532, "regret": 0.35103169083595276, "entropy": 0.07720459997653961, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:47.810617Z", "loop": 2702, "env_steps": 1660723199, "loss": 0.0009750103927217424, "avg_return": 0.452070415019989, "regret": 0.35103169083595276, "entropy": 0.07960838824510574, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:48.971295Z", "loop": 2703, "env_steps": 1661337599, "loss": 0.0010503192897886038, "avg_return": 0.45455947518348694, "regret": 0.35103169083595276, "entropy": 0.07958824187517166, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:50.133039Z", "loop": 2704, "env_steps": 1661951999, "loss": 0.0010001563932746649, "avg_return": 0.4530644714832306, "regret": 0.35103169083595276, "entropy": 0.07967043668031693, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:51.293626Z", "loop": 2705, "env_steps": 1662566399, "loss": 0.0010207415325567126, "avg_return": 0.4497728645801544, "regret": 0.35103169083595276, "entropy": 0.08316446840763092, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:52.454928Z", "loop": 2706, "env_steps": 1663180799, "loss": 0.0010126176057383418, "avg_return": 0.4506590962409973, "regret": 0.35103169083595276, "entropy": 0.08198938518762589, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:53.615219Z", "loop": 2707, "env_steps": 1663795199, "loss": 0.0009821647545322776, "avg_return": 0.4569041132926941, "regret": 0.35103169083595276, "entropy": 0.0863504409790039, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:54.775804Z", "loop": 2708, "env_steps": 1664409599, "loss": 0.0010043998481705785, "avg_return": 0.4584519565105438, "regret": 0.35103169083595276, "entropy": 0.08079260587692261, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:55.936997Z", "loop": 2709, "env_steps": 1665023999, "loss": 0.0007463878719136119, "avg_return": 0.45030295848846436, "regret": 0.35103169083595276, "entropy": 0.07914908975362778, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:57.153140Z", "loop": 2710, "env_steps": 1665638399, "loss": 0.0010525211691856384, "avg_return": 0.4505250155925751, "regret": 0.3509978652000427, "entropy": 0.08371762186288834, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:58.316641Z", "loop": 2711, "env_steps": 1666252799, "loss": 0.0011376189067959785, "avg_return": 0.45630183815956116, "regret": 0.3509978652000427, "entropy": 0.08300209790468216, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:18:59.477490Z", "loop": 2712, "env_steps": 1666867199, "loss": 0.001002538949251175, "avg_return": 0.4573196470737457, "regret": 0.3509978652000427, "entropy": 0.08406639844179153, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:00.643207Z", "loop": 2713, "env_steps": 1667481599, "loss": 0.0010166788706555963, "avg_return": 0.45063507556915283, "regret": 0.3509978652000427, "entropy": 0.08383459597826004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:01.802351Z", "loop": 2714, "env_steps": 1668095999, "loss": 0.0010777373099699616, "avg_return": 0.4504631757736206, "regret": 0.3509978652000427, "entropy": 0.0825166329741478, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:02.962336Z", "loop": 2715, "env_steps": 1668710399, "loss": 0.0013762091984972358, "avg_return": 0.4550086557865143, "regret": 0.3509978652000427, "entropy": 0.08995512872934341, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:04.123357Z", "loop": 2716, "env_steps": 1669324799, "loss": 0.001524049206636846, "avg_return": 0.4606521725654602, "regret": 0.3509978652000427, "entropy": 0.0821998119354248, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:05.289372Z", "loop": 2717, "env_steps": 1669939199, "loss": 0.0015780780231580138, "avg_return": 0.45932161808013916, "regret": 0.3509978652000427, "entropy": 0.08890454471111298, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:06.451854Z", "loop": 2718, "env_steps": 1670553599, "loss": 0.0016677266685292125, "avg_return": 0.45745849609375, "regret": 0.3509978652000427, "entropy": 0.08580014109611511, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:07.612726Z", "loop": 2719, "env_steps": 1671167999, "loss": 0.0017271025571972132, "avg_return": 0.44606080651283264, "regret": 0.3509978652000427, "entropy": 0.09855307638645172, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:08.828429Z", "loop": 2720, "env_steps": 1671782399, "loss": 0.0018895380198955536, "avg_return": 0.4532831013202667, "regret": 0.35070717334747314, "entropy": 0.09744391590356827, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:09.991219Z", "loop": 2721, "env_steps": 1672396799, "loss": 0.001849423162639141, "avg_return": 0.45496460795402527, "regret": 0.35070717334747314, "entropy": 0.09333886206150055, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:11.154308Z", "loop": 2722, "env_steps": 1673011199, "loss": 0.0020928289741277695, "avg_return": 0.4531485140323639, "regret": 0.35070717334747314, "entropy": 0.09694408625364304, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:12.317421Z", "loop": 2723, "env_steps": 1673625599, "loss": 0.0022222124971449375, "avg_return": 0.45420727133750916, "regret": 0.35070717334747314, "entropy": 0.09623761475086212, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:13.478015Z", "loop": 2724, "env_steps": 1674239999, "loss": 0.0020286792423576117, "avg_return": 0.44899699091911316, "regret": 0.35070717334747314, "entropy": 0.09643389284610748, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:14.639434Z", "loop": 2725, "env_steps": 1674854399, "loss": 0.002025602851063013, "avg_return": 0.44941967725753784, "regret": 0.35070717334747314, "entropy": 0.10201699286699295, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:15.799525Z", "loop": 2726, "env_steps": 1675468799, "loss": 0.0023477296344935894, "avg_return": 0.4538823664188385, "regret": 0.35070717334747314, "entropy": 0.0998651534318924, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:16.959921Z", "loop": 2727, "env_steps": 1676083199, "loss": 0.0028452498372644186, "avg_return": 0.45369911193847656, "regret": 0.35070717334747314, "entropy": 0.10398027300834656, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:18.121652Z", "loop": 2728, "env_steps": 1676697599, "loss": 0.002389392349869013, "avg_return": 0.45672085881233215, "regret": 0.35070717334747314, "entropy": 0.10509015619754791, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:19.281812Z", "loop": 2729, "env_steps": 1677311999, "loss": 0.0024858179967850447, "avg_return": 0.4582396149635315, "regret": 0.35070717334747314, "entropy": 0.09346380829811096, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:20.489399Z", "loop": 2730, "env_steps": 1677926399, "loss": 0.002717584138736129, "avg_return": 0.44755473732948303, "regret": 0.351693719625473, "entropy": 0.10445821285247803, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:21.650655Z", "loop": 2731, "env_steps": 1678540799, "loss": 0.0023039039224386215, "avg_return": 0.4513404369354248, "regret": 0.351693719625473, "entropy": 0.10124029964208603, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:22.812023Z", "loop": 2732, "env_steps": 1679155199, "loss": 0.0023731631226837635, "avg_return": 0.45375338196754456, "regret": 0.351693719625473, "entropy": 0.10265158861875534, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:23.972226Z", "loop": 2733, "env_steps": 1679769599, "loss": 0.002293471246957779, "avg_return": 0.4524042308330536, "regret": 0.351693719625473, "entropy": 0.10360373556613922, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:25.133630Z", "loop": 2734, "env_steps": 1680383999, "loss": 0.002276296727359295, "avg_return": 0.4494088888168335, "regret": 0.351693719625473, "entropy": 0.10284510254859924, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:26.294658Z", "loop": 2735, "env_steps": 1680998399, "loss": 0.0020147745963186026, "avg_return": 0.4582562744617462, "regret": 0.351693719625473, "entropy": 0.09006518125534058, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:27.456649Z", "loop": 2736, "env_steps": 1681612799, "loss": 0.0017024849075824022, "avg_return": 0.45504578948020935, "regret": 0.351693719625473, "entropy": 0.0927586480975151, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:28.618520Z", "loop": 2737, "env_steps": 1682227199, "loss": 0.0017963709542527795, "avg_return": 0.4505011737346649, "regret": 0.351693719625473, "entropy": 0.0975370854139328, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:29.778455Z", "loop": 2738, "env_steps": 1682841599, "loss": 0.0017821133369579911, "avg_return": 0.4540783166885376, "regret": 0.351693719625473, "entropy": 0.0936129242181778, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:30.940355Z", "loop": 2739, "env_steps": 1683455999, "loss": 0.0017381560755893588, "avg_return": 0.44381532073020935, "regret": 0.351693719625473, "entropy": 0.09769122302532196, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:32.148286Z", "loop": 2740, "env_steps": 1684070399, "loss": 0.0019006718648597598, "avg_return": 0.45766714215278625, "regret": 0.35075387358665466, "entropy": 0.08933727443218231, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:33.310245Z", "loop": 2741, "env_steps": 1684684799, "loss": 0.001656787353567779, "avg_return": 0.4558049738407135, "regret": 0.35075387358665466, "entropy": 0.08614128828048706, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:34.471052Z", "loop": 2742, "env_steps": 1685299199, "loss": 0.0014913417398929596, "avg_return": 0.4476149082183838, "regret": 0.35075387358665466, "entropy": 0.09218137711286545, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:35.632134Z", "loop": 2743, "env_steps": 1685913599, "loss": 0.0015594966243952513, "avg_return": 0.4601249396800995, "regret": 0.35075387358665466, "entropy": 0.08698193728923798, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:36.792595Z", "loop": 2744, "env_steps": 1686527999, "loss": 0.0015758791705593467, "avg_return": 0.4567429721355438, "regret": 0.35075387358665466, "entropy": 0.08394613862037659, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:37.956579Z", "loop": 2745, "env_steps": 1687142399, "loss": 0.0017251595854759216, "avg_return": 0.46194347739219666, "regret": 0.35075387358665466, "entropy": 0.08606915920972824, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:39.118565Z", "loop": 2746, "env_steps": 1687756799, "loss": 0.001542135956697166, "avg_return": 0.4586334228515625, "regret": 0.35075387358665466, "entropy": 0.0850372314453125, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:40.279141Z", "loop": 2747, "env_steps": 1688371199, "loss": 0.0017410122090950608, "avg_return": 0.45945191383361816, "regret": 0.35075387358665466, "entropy": 0.08910124003887177, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:41.441878Z", "loop": 2748, "env_steps": 1688985599, "loss": 0.0015534560661762953, "avg_return": 0.4530509412288666, "regret": 0.35075387358665466, "entropy": 0.08759111166000366, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:42.605069Z", "loop": 2749, "env_steps": 1689599999, "loss": 0.0017354745650663972, "avg_return": 0.4569113850593567, "regret": 0.35075387358665466, "entropy": 0.09424547106027603, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:43.820090Z", "loop": 2750, "env_steps": 1690214399, "loss": 0.0017326644156128168, "avg_return": 0.45007219910621643, "regret": 0.3508816957473755, "entropy": 0.09156414866447449, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:44.981265Z", "loop": 2751, "env_steps": 1690828799, "loss": 0.0016588751459494233, "avg_return": 0.4509154260158539, "regret": 0.3508816957473755, "entropy": 0.08869363367557526, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:46.142595Z", "loop": 2752, "env_steps": 1691443199, "loss": 0.001712021417915821, "avg_return": 0.4528871774673462, "regret": 0.3508816957473755, "entropy": 0.0929163247346878, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:47.305737Z", "loop": 2753, "env_steps": 1692057599, "loss": 0.001687651383690536, "avg_return": 0.4563746750354767, "regret": 0.3508816957473755, "entropy": 0.0925852581858635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:48.466962Z", "loop": 2754, "env_steps": 1692671999, "loss": 0.0017606699839234352, "avg_return": 0.4532710313796997, "regret": 0.3508816957473755, "entropy": 0.09562181681394577, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:49.629130Z", "loop": 2755, "env_steps": 1693286399, "loss": 0.0018442001892253757, "avg_return": 0.45427998900413513, "regret": 0.3508816957473755, "entropy": 0.08988304436206818, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:50.789261Z", "loop": 2756, "env_steps": 1693900799, "loss": 0.0019750322680920362, "avg_return": 0.4585011303424835, "regret": 0.3508816957473755, "entropy": 0.09192166477441788, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:51.950592Z", "loop": 2757, "env_steps": 1694515199, "loss": 0.001967964693903923, "avg_return": 0.4560681879520416, "regret": 0.3508816957473755, "entropy": 0.08835513144731522, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:53.111594Z", "loop": 2758, "env_steps": 1695129599, "loss": 0.001936674932949245, "avg_return": 0.45242777466773987, "regret": 0.3508816957473755, "entropy": 0.09181239455938339, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:54.271825Z", "loop": 2759, "env_steps": 1695743999, "loss": 0.0019146911799907684, "avg_return": 0.45295870304107666, "regret": 0.3508816957473755, "entropy": 0.09405378252267838, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:55.481298Z", "loop": 2760, "env_steps": 1696358399, "loss": 0.0018540535820648074, "avg_return": 0.45138755440711975, "regret": 0.35094013810157776, "entropy": 0.09307856857776642, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:56.641963Z", "loop": 2761, "env_steps": 1696972799, "loss": 0.0019694564398378134, "avg_return": 0.45757782459259033, "regret": 0.35094013810157776, "entropy": 0.09330391138792038, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:57.803248Z", "loop": 2762, "env_steps": 1697587199, "loss": 0.0016489143017679453, "avg_return": 0.45483583211898804, "regret": 0.35094013810157776, "entropy": 0.09255219250917435, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:19:58.963003Z", "loop": 2763, "env_steps": 1698201599, "loss": 0.0018273221794515848, "avg_return": 0.4503714144229889, "regret": 0.35094013810157776, "entropy": 0.0900324359536171, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:00.124364Z", "loop": 2764, "env_steps": 1698815999, "loss": 0.0017469251761212945, "avg_return": 0.45300132036209106, "regret": 0.35094013810157776, "entropy": 0.08653269708156586, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:01.290587Z", "loop": 2765, "env_steps": 1699430399, "loss": 0.0014719142345711589, "avg_return": 0.4573274850845337, "regret": 0.35094013810157776, "entropy": 0.0899314284324646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:02.451763Z", "loop": 2766, "env_steps": 1700044799, "loss": 0.0014256936265155673, "avg_return": 0.44797253608703613, "regret": 0.35094013810157776, "entropy": 0.0843096524477005, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:03.614332Z", "loop": 2767, "env_steps": 1700659199, "loss": 0.0016675584483891726, "avg_return": 0.45912811160087585, "regret": 0.35094013810157776, "entropy": 0.08654704689979553, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:04.774515Z", "loop": 2768, "env_steps": 1701273599, "loss": 0.0016866717487573624, "avg_return": 0.4574234187602997, "regret": 0.35094013810157776, "entropy": 0.08996795117855072, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:05.935424Z", "loop": 2769, "env_steps": 1701887999, "loss": 0.0016066780081018806, "avg_return": 0.45203328132629395, "regret": 0.35094013810157776, "entropy": 0.09239396452903748, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:07.142421Z", "loop": 2770, "env_steps": 1702502399, "loss": 0.0015563199995085597, "avg_return": 0.44767558574676514, "regret": 0.35101714730262756, "entropy": 0.08970306813716888, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:08.304182Z", "loop": 2771, "env_steps": 1703116799, "loss": 0.0018608305836096406, "avg_return": 0.4508552551269531, "regret": 0.35101714730262756, "entropy": 0.08965334296226501, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:09.465539Z", "loop": 2772, "env_steps": 1703731199, "loss": 0.0016803424805402756, "avg_return": 0.45639660954475403, "regret": 0.35101714730262756, "entropy": 0.09326525032520294, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:10.625494Z", "loop": 2773, "env_steps": 1704345599, "loss": 0.0016936464235186577, "avg_return": 0.45885518193244934, "regret": 0.35101714730262756, "entropy": 0.08778028935194016, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:11.787129Z", "loop": 2774, "env_steps": 1704959999, "loss": 0.0017381813377141953, "avg_return": 0.45145657658576965, "regret": 0.35101714730262756, "entropy": 0.0929274633526802, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:12.947744Z", "loop": 2775, "env_steps": 1705574399, "loss": 0.0015902422601357102, "avg_return": 0.4480101764202118, "regret": 0.35101714730262756, "entropy": 0.09183699637651443, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:14.109328Z", "loop": 2776, "env_steps": 1706188799, "loss": 0.0015472423983737826, "avg_return": 0.45558223128318787, "regret": 0.35101714730262756, "entropy": 0.08949151635169983, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:15.269448Z", "loop": 2777, "env_steps": 1706803199, "loss": 0.0013466553064063191, "avg_return": 0.45818543434143066, "regret": 0.35101714730262756, "entropy": 0.08898277580738068, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:16.430698Z", "loop": 2778, "env_steps": 1707417599, "loss": 0.0014619574649259448, "avg_return": 0.4541698396205902, "regret": 0.35101714730262756, "entropy": 0.0893157348036766, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:17.591176Z", "loop": 2779, "env_steps": 1708031999, "loss": 0.0015387771418318152, "avg_return": 0.45474809408187866, "regret": 0.35101714730262756, "entropy": 0.08010110259056091, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:18.800129Z", "loop": 2780, "env_steps": 1708646399, "loss": 0.002080444246530533, "avg_return": 0.449921578168869, "regret": 0.35078269243240356, "entropy": 0.08445568382740021, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:19.961381Z", "loop": 2781, "env_steps": 1709260799, "loss": 0.0021155723370611668, "avg_return": 0.44107767939567566, "regret": 0.35078269243240356, "entropy": 0.08752456307411194, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:21.121993Z", "loop": 2782, "env_steps": 1709875199, "loss": 0.002500680508092046, "avg_return": 0.45064887404441833, "regret": 0.35078269243240356, "entropy": 0.08744507282972336, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:22.281838Z", "loop": 2783, "env_steps": 1710489599, "loss": 0.0024002210702747107, "avg_return": 0.45371633768081665, "regret": 0.35078269243240356, "entropy": 0.08281346410512924, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:23.442668Z", "loop": 2784, "env_steps": 1711103999, "loss": 0.0021775932982563972, "avg_return": 0.4523204267024994, "regret": 0.35078269243240356, "entropy": 0.08274564892053604, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:24.604736Z", "loop": 2785, "env_steps": 1711718399, "loss": 0.0027695223689079285, "avg_return": 0.45874595642089844, "regret": 0.35078269243240356, "entropy": 0.08076591044664383, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:25.764325Z", "loop": 2786, "env_steps": 1712332799, "loss": 0.0026499226223677397, "avg_return": 0.45008596777915955, "regret": 0.35078269243240356, "entropy": 0.08060403168201447, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:26.925545Z", "loop": 2787, "env_steps": 1712947199, "loss": 0.0022938738111406565, "avg_return": 0.4506649971008301, "regret": 0.35078269243240356, "entropy": 0.07787123322486877, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:28.086063Z", "loop": 2788, "env_steps": 1713561599, "loss": 0.0024714642204344273, "avg_return": 0.45482581853866577, "regret": 0.35078269243240356, "entropy": 0.07610038667917252, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:29.247279Z", "loop": 2789, "env_steps": 1714175999, "loss": 0.0022756021935492754, "avg_return": 0.45598044991493225, "regret": 0.35078269243240356, "entropy": 0.07471002638339996, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:30.458821Z", "loop": 2790, "env_steps": 1714790399, "loss": 0.002373384078964591, "avg_return": 0.4591600000858307, "regret": 0.3511183559894562, "entropy": 0.07624948769807816, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:31.619955Z", "loop": 2791, "env_steps": 1715404799, "loss": 0.0021056076511740685, "avg_return": 0.4425124228000641, "regret": 0.3511183559894562, "entropy": 0.07534001767635345, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:32.781470Z", "loop": 2792, "env_steps": 1716019199, "loss": 0.0025941345375031233, "avg_return": 0.45130762457847595, "regret": 0.3511183559894562, "entropy": 0.07777589559555054, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:33.942981Z", "loop": 2793, "env_steps": 1716633599, "loss": 0.00245799426920712, "avg_return": 0.4618508517742157, "regret": 0.3511183559894562, "entropy": 0.07351016253232956, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:35.103711Z", "loop": 2794, "env_steps": 1717247999, "loss": 0.002431095577776432, "avg_return": 0.45920267701148987, "regret": 0.3511183559894562, "entropy": 0.07306846231222153, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:36.263711Z", "loop": 2795, "env_steps": 1717862399, "loss": 0.0025471383705735207, "avg_return": 0.451160192489624, "regret": 0.3511183559894562, "entropy": 0.07824002951383591, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:37.424918Z", "loop": 2796, "env_steps": 1718476799, "loss": 0.0027165052015334368, "avg_return": 0.45128679275512695, "regret": 0.3511183559894562, "entropy": 0.07398978620767593, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:38.584818Z", "loop": 2797, "env_steps": 1719091199, "loss": 0.0027448111213743687, "avg_return": 0.4450882077217102, "regret": 0.3511183559894562, "entropy": 0.08090494573116302, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:39.745670Z", "loop": 2798, "env_steps": 1719705599, "loss": 0.003390207886695862, "avg_return": 0.4562479853630066, "regret": 0.3511183559894562, "entropy": 0.08821456879377365, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:40.907173Z", "loop": 2799, "env_steps": 1720319999, "loss": 0.003374370513483882, "avg_return": 0.451286643743515, "regret": 0.3511183559894562, "entropy": 0.09234646707773209, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:42.113200Z", "loop": 2800, "env_steps": 1720934399, "loss": 0.0035742854233831167, "avg_return": 0.45848262310028076, "regret": 0.3526804745197296, "entropy": 0.09182573109865189, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:43.276250Z", "loop": 2801, "env_steps": 1721548799, "loss": 0.0038021139334887266, "avg_return": 0.44981664419174194, "regret": 0.3526804745197296, "entropy": 0.09046893566846848, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:44.437794Z", "loop": 2802, "env_steps": 1722163199, "loss": 0.003293363144621253, "avg_return": 0.45225292444229126, "regret": 0.3526804745197296, "entropy": 0.08237283676862717, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:45.601113Z", "loop": 2803, "env_steps": 1722777599, "loss": 0.0030819193925708532, "avg_return": 0.45883607864379883, "regret": 0.3526804745197296, "entropy": 0.08248986303806305, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:46.762654Z", "loop": 2804, "env_steps": 1723391999, "loss": 0.0028672858607023954, "avg_return": 0.452249675989151, "regret": 0.3526804745197296, "entropy": 0.0795164629817009, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:47.924987Z", "loop": 2805, "env_steps": 1724006399, "loss": 0.003074735403060913, "avg_return": 0.4546073377132416, "regret": 0.3526804745197296, "entropy": 0.07857505977153778, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:49.087938Z", "loop": 2806, "env_steps": 1724620799, "loss": 0.0026768201496452093, "avg_return": 0.45814764499664307, "regret": 0.3526804745197296, "entropy": 0.0774109736084938, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:50.249237Z", "loop": 2807, "env_steps": 1725235199, "loss": 0.0022311753127723932, "avg_return": 0.45373862981796265, "regret": 0.3526804745197296, "entropy": 0.08104372769594193, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:51.412237Z", "loop": 2808, "env_steps": 1725849599, "loss": 0.0024336380884051323, "avg_return": 0.4536936581134796, "regret": 0.3526804745197296, "entropy": 0.07364564388990402, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:52.572412Z", "loop": 2809, "env_steps": 1726463999, "loss": 0.0020630634389817715, "avg_return": 0.4469214975833893, "regret": 0.3526804745197296, "entropy": 0.07146238535642624, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:53.776992Z", "loop": 2810, "env_steps": 1727078399, "loss": 0.0018914284883067012, "avg_return": 0.4484138488769531, "regret": 0.3508392572402954, "entropy": 0.07620861381292343, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:54.936272Z", "loop": 2811, "env_steps": 1727692799, "loss": 0.0018126120558008552, "avg_return": 0.4494328498840332, "regret": 0.3508392572402954, "entropy": 0.07354322075843811, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:56.097278Z", "loop": 2812, "env_steps": 1728307199, "loss": 0.0017872689059004188, "avg_return": 0.45474523305892944, "regret": 0.3508392572402954, "entropy": 0.07712387293577194, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:57.257537Z", "loop": 2813, "env_steps": 1728921599, "loss": 0.0016803890466690063, "avg_return": 0.443381667137146, "regret": 0.3508392572402954, "entropy": 0.08215998113155365, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:58.417876Z", "loop": 2814, "env_steps": 1729535999, "loss": 0.001903893076814711, "avg_return": 0.4560403525829315, "regret": 0.3508392572402954, "entropy": 0.07937993854284286, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:20:59.577531Z", "loop": 2815, "env_steps": 1730150399, "loss": 0.002005126792937517, "avg_return": 0.45897290110588074, "regret": 0.3508392572402954, "entropy": 0.08053261041641235, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:00.738382Z", "loop": 2816, "env_steps": 1730764799, "loss": 0.00190264661796391, "avg_return": 0.453474223613739, "regret": 0.3508392572402954, "entropy": 0.0843929648399353, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:01.904397Z", "loop": 2817, "env_steps": 1731379199, "loss": 0.002055662451311946, "avg_return": 0.45510774850845337, "regret": 0.3508392572402954, "entropy": 0.08356887102127075, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:03.064908Z", "loop": 2818, "env_steps": 1731993599, "loss": 0.0017080331454053521, "avg_return": 0.4465430676937103, "regret": 0.3508392572402954, "entropy": 0.08600243180990219, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:04.225276Z", "loop": 2819, "env_steps": 1732607999, "loss": 0.0018957607680931687, "avg_return": 0.4580303132534027, "regret": 0.3508392572402954, "entropy": 0.07889565825462341, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:05.433879Z", "loop": 2820, "env_steps": 1733222399, "loss": 0.001977676758542657, "avg_return": 0.44939127564430237, "regret": 0.350746750831604, "entropy": 0.08362491428852081, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:06.596255Z", "loop": 2821, "env_steps": 1733836799, "loss": 0.001914985477924347, "avg_return": 0.44765642285346985, "regret": 0.350746750831604, "entropy": 0.08132024854421616, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:07.757728Z", "loop": 2822, "env_steps": 1734451199, "loss": 0.001932598534040153, "avg_return": 0.4579913318157196, "regret": 0.350746750831604, "entropy": 0.07942549884319305, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:08.919530Z", "loop": 2823, "env_steps": 1735065599, "loss": 0.0018581533804535866, "avg_return": 0.4553416073322296, "regret": 0.350746750831604, "entropy": 0.07917973399162292, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:10.081875Z", "loop": 2824, "env_steps": 1735679999, "loss": 0.0020448844879865646, "avg_return": 0.45148155093193054, "regret": 0.350746750831604, "entropy": 0.08084297925233841, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:11.243628Z", "loop": 2825, "env_steps": 1736294399, "loss": 0.002236716914921999, "avg_return": 0.45293864607810974, "regret": 0.350746750831604, "entropy": 0.08058616518974304, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:12.406657Z", "loop": 2826, "env_steps": 1736908799, "loss": 0.0018979493761435151, "avg_return": 0.4430626928806305, "regret": 0.350746750831604, "entropy": 0.07996756583452225, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:13.567924Z", "loop": 2827, "env_steps": 1737523199, "loss": 0.00209123850800097, "avg_return": 0.45020055770874023, "regret": 0.350746750831604, "entropy": 0.08562258630990982, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:14.729297Z", "loop": 2828, "env_steps": 1738137599, "loss": 0.001872120425105095, "avg_return": 0.4435083568096161, "regret": 0.350746750831604, "entropy": 0.09063169360160828, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:15.892260Z", "loop": 2829, "env_steps": 1738751999, "loss": 0.001890775398351252, "avg_return": 0.45801281929016113, "regret": 0.350746750831604, "entropy": 0.08441349864006042, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:17.100493Z", "loop": 2830, "env_steps": 1739366399, "loss": 0.0016015165019780397, "avg_return": 0.4528053402900696, "regret": 0.35079148411750793, "entropy": 0.08232773840427399, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:18.263972Z", "loop": 2831, "env_steps": 1739980799, "loss": 0.0012791156768798828, "avg_return": 0.45076391100883484, "regret": 0.35079148411750793, "entropy": 0.08643078804016113, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:19.424972Z", "loop": 2832, "env_steps": 1740595199, "loss": 0.0011603524908423424, "avg_return": 0.45244908332824707, "regret": 0.35079148411750793, "entropy": 0.09239324182271957, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:20.586900Z", "loop": 2833, "env_steps": 1741209599, "loss": 0.001283879391849041, "avg_return": 0.4494701325893402, "regret": 0.35079148411750793, "entropy": 0.08532959967851639, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:21.747755Z", "loop": 2834, "env_steps": 1741823999, "loss": 0.0015727191930636764, "avg_return": 0.45691102743148804, "regret": 0.35079148411750793, "entropy": 0.07896482199430466, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:22.911866Z", "loop": 2835, "env_steps": 1742438399, "loss": 0.0017843408277258277, "avg_return": 0.4446980953216553, "regret": 0.35079148411750793, "entropy": 0.08258846402168274, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:24.073908Z", "loop": 2836, "env_steps": 1743052799, "loss": 0.0017351325368508697, "avg_return": 0.45510876178741455, "regret": 0.35079148411750793, "entropy": 0.08223085105419159, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:25.233911Z", "loop": 2837, "env_steps": 1743667199, "loss": 0.0015443677548319101, "avg_return": 0.4506971836090088, "regret": 0.35079148411750793, "entropy": 0.08620585501194, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:26.395347Z", "loop": 2838, "env_steps": 1744281599, "loss": 0.001374666579067707, "avg_return": 0.458234578371048, "regret": 0.35079148411750793, "entropy": 0.07684045284986496, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:27.557142Z", "loop": 2839, "env_steps": 1744895999, "loss": 0.0011320541379973292, "avg_return": 0.45886215567588806, "regret": 0.35079148411750793, "entropy": 0.07625116407871246, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:28.768278Z", "loop": 2840, "env_steps": 1745510399, "loss": 0.0007562125683762133, "avg_return": 0.44970980286598206, "regret": 0.35177189111709595, "entropy": 0.07110359519720078, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:29.929671Z", "loop": 2841, "env_steps": 1746124799, "loss": 0.0010163075057789683, "avg_return": 0.46101024746894836, "regret": 0.35177189111709595, "entropy": 0.07149787247180939, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:31.091192Z", "loop": 2842, "env_steps": 1746739199, "loss": 0.0014635025290772319, "avg_return": 0.4540489912033081, "regret": 0.35177189111709595, "entropy": 0.07649682462215424, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:32.252065Z", "loop": 2843, "env_steps": 1747353599, "loss": 0.0015583668136969209, "avg_return": 0.44676560163497925, "regret": 0.35177189111709595, "entropy": 0.08637592196464539, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:33.414976Z", "loop": 2844, "env_steps": 1747967999, "loss": 0.0020519939716905355, "avg_return": 0.45278409123420715, "regret": 0.35177189111709595, "entropy": 0.08956706523895264, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:34.577258Z", "loop": 2845, "env_steps": 1748582399, "loss": 0.0025532774161547422, "avg_return": 0.4520651400089264, "regret": 0.35177189111709595, "entropy": 0.09529134631156921, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:35.738102Z", "loop": 2846, "env_steps": 1749196799, "loss": 0.002645431784912944, "avg_return": 0.44111156463623047, "regret": 0.35177189111709595, "entropy": 0.10193751752376556, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:36.899859Z", "loop": 2847, "env_steps": 1749811199, "loss": 0.0029732915572822094, "avg_return": 0.4492155611515045, "regret": 0.35177189111709595, "entropy": 0.09818203002214432, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:38.059906Z", "loop": 2848, "env_steps": 1750425599, "loss": 0.0030438248068094254, "avg_return": 0.4424213767051697, "regret": 0.35177189111709595, "entropy": 0.10033301264047623, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:39.220936Z", "loop": 2849, "env_steps": 1751039999, "loss": 0.0027843068819493055, "avg_return": 0.449375718832016, "regret": 0.35177189111709595, "entropy": 0.10256164520978928, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:40.433731Z", "loop": 2850, "env_steps": 1751654399, "loss": 0.002940970007330179, "avg_return": 0.4560283422470093, "regret": 0.35383254289627075, "entropy": 0.09349172562360764, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:41.595821Z", "loop": 2851, "env_steps": 1752268799, "loss": 0.002462193835526705, "avg_return": 0.45146414637565613, "regret": 0.35383254289627075, "entropy": 0.09662420302629471, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:42.758158Z", "loop": 2852, "env_steps": 1752883199, "loss": 0.002158900024369359, "avg_return": 0.4523873031139374, "regret": 0.35383254289627075, "entropy": 0.09207411110401154, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:43.919411Z", "loop": 2853, "env_steps": 1753497599, "loss": 0.0019449252868071198, "avg_return": 0.4520038962364197, "regret": 0.35383254289627075, "entropy": 0.08738070726394653, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:45.080467Z", "loop": 2854, "env_steps": 1754111999, "loss": 0.001771440147422254, "avg_return": 0.45308488607406616, "regret": 0.35383254289627075, "entropy": 0.08247793465852737, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:46.240091Z", "loop": 2855, "env_steps": 1754726399, "loss": 0.001353682135231793, "avg_return": 0.44863831996917725, "regret": 0.35383254289627075, "entropy": 0.07670260965824127, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:47.400409Z", "loop": 2856, "env_steps": 1755340799, "loss": 0.0010600521927699447, "avg_return": 0.451732337474823, "regret": 0.35383254289627075, "entropy": 0.07410726696252823, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:48.560315Z", "loop": 2857, "env_steps": 1755955199, "loss": 0.0010183693375438452, "avg_return": 0.4512251019477844, "regret": 0.35383254289627075, "entropy": 0.0777386948466301, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:49.721148Z", "loop": 2858, "env_steps": 1756569599, "loss": 0.0008503393619321287, "avg_return": 0.453351765871048, "regret": 0.35383254289627075, "entropy": 0.0805756077170372, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:50.883675Z", "loop": 2859, "env_steps": 1757183999, "loss": 0.0011668703518807888, "avg_return": 0.45254039764404297, "regret": 0.35383254289627075, "entropy": 0.07711143791675568, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:52.091383Z", "loop": 2860, "env_steps": 1757798399, "loss": 0.0011362482327967882, "avg_return": 0.4494923949241638, "regret": 0.3508622646331787, "entropy": 0.08103792369365692, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:53.253325Z", "loop": 2861, "env_steps": 1758412799, "loss": 0.001128569943830371, "avg_return": 0.4519181549549103, "regret": 0.3508622646331787, "entropy": 0.08711504936218262, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:54.414055Z", "loop": 2862, "env_steps": 1759027199, "loss": 0.0014799591153860092, "avg_return": 0.45175984501838684, "regret": 0.3508622646331787, "entropy": 0.08375170081853867, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:55.579296Z", "loop": 2863, "env_steps": 1759641599, "loss": 0.0016005737707018852, "avg_return": 0.44404903054237366, "regret": 0.3508622646331787, "entropy": 0.09266489744186401, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:56.739617Z", "loop": 2864, "env_steps": 1760255999, "loss": 0.0018095466075465083, "avg_return": 0.45374470949172974, "regret": 0.3508622646331787, "entropy": 0.09489601850509644, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:57.900229Z", "loop": 2865, "env_steps": 1760870399, "loss": 0.0017012981697916985, "avg_return": 0.4528917670249939, "regret": 0.3508622646331787, "entropy": 0.09838090091943741, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:21:59.062298Z", "loop": 2866, "env_steps": 1761484799, "loss": 0.001990651246160269, "avg_return": 0.45688527822494507, "regret": 0.3508622646331787, "entropy": 0.09567710757255554, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:00.224117Z", "loop": 2867, "env_steps": 1762099199, "loss": 0.001869901898317039, "avg_return": 0.45022040605545044, "regret": 0.3508622646331787, "entropy": 0.0895751491189003, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:01.385927Z", "loop": 2868, "env_steps": 1762713599, "loss": 0.001998473424464464, "avg_return": 0.4587031304836273, "regret": 0.3508622646331787, "entropy": 0.08731509745121002, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:02.546228Z", "loop": 2869, "env_steps": 1763327999, "loss": 0.0018798512173816562, "avg_return": 0.4559081494808197, "regret": 0.3508622646331787, "entropy": 0.08894172310829163, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:03.755120Z", "loop": 2870, "env_steps": 1763942399, "loss": 0.00199618237093091, "avg_return": 0.4440857172012329, "regret": 0.35074758529663086, "entropy": 0.08962522447109222, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:04.915640Z", "loop": 2871, "env_steps": 1764556799, "loss": 0.0017244912451133132, "avg_return": 0.4542510211467743, "regret": 0.35074758529663086, "entropy": 0.09025812149047852, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:06.075741Z", "loop": 2872, "env_steps": 1765171199, "loss": 0.0017047967994585633, "avg_return": 0.45287182927131653, "regret": 0.35074758529663086, "entropy": 0.0884673148393631, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:07.234622Z", "loop": 2873, "env_steps": 1765785599, "loss": 0.0018032193183898926, "avg_return": 0.4533368945121765, "regret": 0.35074758529663086, "entropy": 0.0859004557132721, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:08.394300Z", "loop": 2874, "env_steps": 1766399999, "loss": 0.0016722253058105707, "avg_return": 0.45582184195518494, "regret": 0.35074758529663086, "entropy": 0.08856654167175293, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:09.554789Z", "loop": 2875, "env_steps": 1767014399, "loss": 0.0016997501952573657, "avg_return": 0.4429013729095459, "regret": 0.35074758529663086, "entropy": 0.09235784411430359, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:10.714697Z", "loop": 2876, "env_steps": 1767628799, "loss": 0.0020321307238191366, "avg_return": 0.4566517770290375, "regret": 0.35074758529663086, "entropy": 0.08779508620500565, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:11.875084Z", "loop": 2877, "env_steps": 1768243199, "loss": 0.0017979479162022471, "avg_return": 0.4497604966163635, "regret": 0.35074758529663086, "entropy": 0.09332351386547089, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:13.033789Z", "loop": 2878, "env_steps": 1768857599, "loss": 0.0017107557505369186, "avg_return": 0.4543463885784149, "regret": 0.35074758529663086, "entropy": 0.0893797054886818, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:14.194434Z", "loop": 2879, "env_steps": 1769471999, "loss": 0.0015915196854621172, "avg_return": 0.4510980248451233, "regret": 0.35074758529663086, "entropy": 0.08792078495025635, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:15.399191Z", "loop": 2880, "env_steps": 1770086399, "loss": 0.0016384873306378722, "avg_return": 0.4524373412132263, "regret": 0.35072842240333557, "entropy": 0.09001544862985611, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:16.561231Z", "loop": 2881, "env_steps": 1770700799, "loss": 0.0012392991920933127, "avg_return": 0.45258936285972595, "regret": 0.35072842240333557, "entropy": 0.08800751715898514, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:17.721644Z", "loop": 2882, "env_steps": 1771315199, "loss": 0.0010783803882077336, "avg_return": 0.4484677314758301, "regret": 0.35072842240333557, "entropy": 0.08347102999687195, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:18.883080Z", "loop": 2883, "env_steps": 1771929599, "loss": 0.0009712693281471729, "avg_return": 0.45172119140625, "regret": 0.35072842240333557, "entropy": 0.07888910919427872, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:20.043393Z", "loop": 2884, "env_steps": 1772543999, "loss": 0.0009986086515709758, "avg_return": 0.4493285119533539, "regret": 0.35072842240333557, "entropy": 0.07976923137903214, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:21.204641Z", "loop": 2885, "env_steps": 1773158399, "loss": 0.0013198998058214784, "avg_return": 0.45396214723587036, "regret": 0.35072842240333557, "entropy": 0.08570089936256409, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:22.366610Z", "loop": 2886, "env_steps": 1773772799, "loss": 0.0014606408076360822, "avg_return": 0.4472174048423767, "regret": 0.35072842240333557, "entropy": 0.08670558035373688, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:23.527265Z", "loop": 2887, "env_steps": 1774387199, "loss": 0.001616406487300992, "avg_return": 0.45518383383750916, "regret": 0.35072842240333557, "entropy": 0.09098353981971741, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:24.688695Z", "loop": 2888, "env_steps": 1775001599, "loss": 0.0018752707401290536, "avg_return": 0.45427730679512024, "regret": 0.35072842240333557, "entropy": 0.0914786234498024, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:25.848949Z", "loop": 2889, "env_steps": 1775615999, "loss": 0.0016445210203528404, "avg_return": 0.4520251452922821, "regret": 0.35072842240333557, "entropy": 0.09530183672904968, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:27.059100Z", "loop": 2890, "env_steps": 1776230399, "loss": 0.0017264260677620769, "avg_return": 0.452182412147522, "regret": 0.3513568937778473, "entropy": 0.08893786370754242, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:28.219578Z", "loop": 2891, "env_steps": 1776844799, "loss": 0.0017791008576750755, "avg_return": 0.45604950189590454, "regret": 0.3513568937778473, "entropy": 0.09227674454450607, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:29.381977Z", "loop": 2892, "env_steps": 1777459199, "loss": 0.0018527640495449305, "avg_return": 0.45469900965690613, "regret": 0.3513568937778473, "entropy": 0.09193821251392365, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:30.542692Z", "loop": 2893, "env_steps": 1778073599, "loss": 0.0016052213031798601, "avg_return": 0.4506046772003174, "regret": 0.3513568937778473, "entropy": 0.0912574827671051, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:31.704555Z", "loop": 2894, "env_steps": 1778687999, "loss": 0.0020214191172271967, "avg_return": 0.4515639841556549, "regret": 0.3513568937778473, "entropy": 0.09008710086345673, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:32.867350Z", "loop": 2895, "env_steps": 1779302399, "loss": 0.0015777783701196313, "avg_return": 0.45759934186935425, "regret": 0.3513568937778473, "entropy": 0.0869988352060318, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:34.028385Z", "loop": 2896, "env_steps": 1779916799, "loss": 0.001493964227847755, "avg_return": 0.4604322016239166, "regret": 0.3513568937778473, "entropy": 0.07833972573280334, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:35.190489Z", "loop": 2897, "env_steps": 1780531199, "loss": 0.001069326652213931, "avg_return": 0.4480128586292267, "regret": 0.3513568937778473, "entropy": 0.08203244209289551, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:36.351236Z", "loop": 2898, "env_steps": 1781145599, "loss": 0.0010480487253516912, "avg_return": 0.44768083095550537, "regret": 0.3513568937778473, "entropy": 0.07772714644670486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:37.512669Z", "loop": 2899, "env_steps": 1781759999, "loss": 0.0008554297382943332, "avg_return": 0.45410969853401184, "regret": 0.3513568937778473, "entropy": 0.0779692679643631, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:38.731107Z", "loop": 2900, "env_steps": 1782374399, "loss": 0.0008706498192623258, "avg_return": 0.4525069296360016, "regret": 0.35106518864631653, "entropy": 0.07807008922100067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:39.891916Z", "loop": 2901, "env_steps": 1782988799, "loss": 0.0008855749038048089, "avg_return": 0.4526904821395874, "regret": 0.35106518864631653, "entropy": 0.07623377442359924, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:41.052788Z", "loop": 2902, "env_steps": 1783603199, "loss": 0.0008458485826849937, "avg_return": 0.4571368396282196, "regret": 0.35106518864631653, "entropy": 0.07702125608921051, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:42.213116Z", "loop": 2903, "env_steps": 1784217599, "loss": 0.0009420771966688335, "avg_return": 0.45354706048965454, "regret": 0.35106518864631653, "entropy": 0.07642904669046402, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:43.375176Z", "loop": 2904, "env_steps": 1784831999, "loss": 0.000792207196354866, "avg_return": 0.4475630223751068, "regret": 0.35106518864631653, "entropy": 0.08171943575143814, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:44.536845Z", "loop": 2905, "env_steps": 1785446399, "loss": 0.0009029737557284534, "avg_return": 0.45336732268333435, "regret": 0.35106518864631653, "entropy": 0.07662900537252426, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:45.698742Z", "loop": 2906, "env_steps": 1786060799, "loss": 0.000788115372415632, "avg_return": 0.45497560501098633, "regret": 0.35106518864631653, "entropy": 0.07997716963291168, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:46.860905Z", "loop": 2907, "env_steps": 1786675199, "loss": 0.0007903423975221813, "avg_return": 0.4522474408149719, "regret": 0.35106518864631653, "entropy": 0.07877789437770844, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:48.022171Z", "loop": 2908, "env_steps": 1787289599, "loss": 0.0008993893279694021, "avg_return": 0.4541604816913605, "regret": 0.35106518864631653, "entropy": 0.07803074270486832, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:49.183497Z", "loop": 2909, "env_steps": 1787903999, "loss": 0.001056505716405809, "avg_return": 0.45471081137657166, "regret": 0.35106518864631653, "entropy": 0.08125942945480347, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:50.397935Z", "loop": 2910, "env_steps": 1788518399, "loss": 0.0011576464166864753, "avg_return": 0.45976948738098145, "regret": 0.3507879376411438, "entropy": 0.08496467769145966, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:51.559044Z", "loop": 2911, "env_steps": 1789132799, "loss": 0.0011220283340662718, "avg_return": 0.4522366523742676, "regret": 0.3507879376411438, "entropy": 0.08238708972930908, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:52.717948Z", "loop": 2912, "env_steps": 1789747199, "loss": 0.0012017663102596998, "avg_return": 0.4442024827003479, "regret": 0.3507879376411438, "entropy": 0.08354192227125168, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:53.879065Z", "loop": 2913, "env_steps": 1790361599, "loss": 0.0014392771990969777, "avg_return": 0.46176403760910034, "regret": 0.3507879376411438, "entropy": 0.08063477277755737, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:55.040103Z", "loop": 2914, "env_steps": 1790975999, "loss": 0.0013492516009137034, "avg_return": 0.45263051986694336, "regret": 0.3507879376411438, "entropy": 0.0940045714378357, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:56.200337Z", "loop": 2915, "env_steps": 1791590399, "loss": 0.0016438417369499803, "avg_return": 0.4556114673614502, "regret": 0.3507879376411438, "entropy": 0.08575904369354248, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:57.361753Z", "loop": 2916, "env_steps": 1792204799, "loss": 0.0016760770231485367, "avg_return": 0.4530108869075775, "regret": 0.3507879376411438, "entropy": 0.08989691734313965, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:58.521636Z", "loop": 2917, "env_steps": 1792819199, "loss": 0.0015088430372998118, "avg_return": 0.4568724036216736, "regret": 0.3507879376411438, "entropy": 0.09194043278694153, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:22:59.687436Z", "loop": 2918, "env_steps": 1793433599, "loss": 0.0019495170563459396, "avg_return": 0.46099385619163513, "regret": 0.3507879376411438, "entropy": 0.08931954950094223, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:00.849896Z", "loop": 2919, "env_steps": 1794047999, "loss": 0.0017041809624060988, "avg_return": 0.45688533782958984, "regret": 0.3507879376411438, "entropy": 0.09405932575464249, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:02.062398Z", "loop": 2920, "env_steps": 1794662399, "loss": 0.0020413463935256004, "avg_return": 0.45508870482444763, "regret": 0.35071223974227905, "entropy": 0.09343831986188889, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:03.225015Z", "loop": 2921, "env_steps": 1795276799, "loss": 0.0018412228673696518, "avg_return": 0.4505622088909149, "regret": 0.35071223974227905, "entropy": 0.09230517596006393, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:04.389069Z", "loop": 2922, "env_steps": 1795891199, "loss": 0.0016102103982120752, "avg_return": 0.44300028681755066, "regret": 0.35071223974227905, "entropy": 0.09163589030504227, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:05.550762Z", "loop": 2923, "env_steps": 1796505599, "loss": 0.0017023783875629306, "avg_return": 0.44860923290252686, "regret": 0.35071223974227905, "entropy": 0.09106242656707764, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:06.710635Z", "loop": 2924, "env_steps": 1797119999, "loss": 0.0019038928439840674, "avg_return": 0.4462570250034332, "regret": 0.35071223974227905, "entropy": 0.0844946950674057, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:07.872184Z", "loop": 2925, "env_steps": 1797734399, "loss": 0.0017230281373485923, "avg_return": 0.45461589097976685, "regret": 0.35071223974227905, "entropy": 0.08500111848115921, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:09.031866Z", "loop": 2926, "env_steps": 1798348799, "loss": 0.002013634890317917, "avg_return": 0.4526553452014923, "regret": 0.35071223974227905, "entropy": 0.08552870154380798, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:10.191390Z", "loop": 2927, "env_steps": 1798963199, "loss": 0.0027658462058752775, "avg_return": 0.4576667249202728, "regret": 0.35071223974227905, "entropy": 0.085819773375988, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:11.352619Z", "loop": 2928, "env_steps": 1799577599, "loss": 0.00276132277213037, "avg_return": 0.44636693596839905, "regret": 0.35071223974227905, "entropy": 0.0833398625254631, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:12.512527Z", "loop": 2929, "env_steps": 1800191999, "loss": 0.0029776524752378464, "avg_return": 0.45193493366241455, "regret": 0.35071223974227905, "entropy": 0.08164750039577484, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:13.717140Z", "loop": 2930, "env_steps": 1800806399, "loss": 0.0034394629765301943, "avg_return": 0.45151346921920776, "regret": 0.35226067900657654, "entropy": 0.08779057115316391, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:14.879686Z", "loop": 2931, "env_steps": 1801420799, "loss": 0.003732046578079462, "avg_return": 0.44806286692619324, "regret": 0.35226067900657654, "entropy": 0.09660470485687256, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:16.041301Z", "loop": 2932, "env_steps": 1802035199, "loss": 0.0037737686652690172, "avg_return": 0.4429470896720886, "regret": 0.35226067900657654, "entropy": 0.09556354582309723, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:17.201822Z", "loop": 2933, "env_steps": 1802649599, "loss": 0.0033933629747480154, "avg_return": 0.4445938766002655, "regret": 0.35226067900657654, "entropy": 0.0955401360988617, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:18.363962Z", "loop": 2934, "env_steps": 1803263999, "loss": 0.0034075737930834293, "avg_return": 0.4451432526111603, "regret": 0.35226067900657654, "entropy": 0.09410405904054642, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:19.527471Z", "loop": 2935, "env_steps": 1803878399, "loss": 0.0028644250705838203, "avg_return": 0.45083874464035034, "regret": 0.35226067900657654, "entropy": 0.0880933552980423, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:20.688301Z", "loop": 2936, "env_steps": 1804492799, "loss": 0.0031469014938920736, "avg_return": 0.4529435336589813, "regret": 0.35226067900657654, "entropy": 0.08724746853113174, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:21.849326Z", "loop": 2937, "env_steps": 1805107199, "loss": 0.002935571363195777, "avg_return": 0.4548394978046417, "regret": 0.35226067900657654, "entropy": 0.08410836011171341, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:23.010187Z", "loop": 2938, "env_steps": 1805721599, "loss": 0.0029098347295075655, "avg_return": 0.45089244842529297, "regret": 0.35226067900657654, "entropy": 0.08333800733089447, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:24.172868Z", "loop": 2939, "env_steps": 1806335999, "loss": 0.002452131826430559, "avg_return": 0.44417303800582886, "regret": 0.35226067900657654, "entropy": 0.07835216075181961, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:25.381301Z", "loop": 2940, "env_steps": 1806950399, "loss": 0.002494312124326825, "avg_return": 0.4417479634284973, "regret": 0.35646703839302063, "entropy": 0.07526230067014694, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:26.542277Z", "loop": 2941, "env_steps": 1807564799, "loss": 0.0025525186210870743, "avg_return": 0.4507552683353424, "regret": 0.35646703839302063, "entropy": 0.07473280280828476, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:27.702574Z", "loop": 2942, "env_steps": 1808179199, "loss": 0.002582552609965205, "avg_return": 0.4484367072582245, "regret": 0.35646703839302063, "entropy": 0.07749227434396744, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:28.865733Z", "loop": 2943, "env_steps": 1808793599, "loss": 0.0025356567930430174, "avg_return": 0.45444580912590027, "regret": 0.35646703839302063, "entropy": 0.07614773511886597, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:30.028522Z", "loop": 2944, "env_steps": 1809407999, "loss": 0.0022333026863634586, "avg_return": 0.4481964111328125, "regret": 0.35646703839302063, "entropy": 0.0707358717918396, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:31.189132Z", "loop": 2945, "env_steps": 1810022399, "loss": 0.0025458810850977898, "avg_return": 0.4506783187389374, "regret": 0.35646703839302063, "entropy": 0.07324281334877014, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:32.350608Z", "loop": 2946, "env_steps": 1810636799, "loss": 0.0026691972743719816, "avg_return": 0.4535888135433197, "regret": 0.35646703839302063, "entropy": 0.07202862203121185, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:33.510640Z", "loop": 2947, "env_steps": 1811251199, "loss": 0.0029059459920972586, "avg_return": 0.446616530418396, "regret": 0.35646703839302063, "entropy": 0.07630319148302078, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:34.672364Z", "loop": 2948, "env_steps": 1811865599, "loss": 0.002776632085442543, "avg_return": 0.44824856519699097, "regret": 0.35646703839302063, "entropy": 0.07380595803260803, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:35.832686Z", "loop": 2949, "env_steps": 1812479999, "loss": 0.0029873766470700502, "avg_return": 0.44699469208717346, "regret": 0.35646703839302063, "entropy": 0.07888983935117722, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:37.038638Z", "loop": 2950, "env_steps": 1813094399, "loss": 0.0031889763195067644, "avg_return": 0.45620986819267273, "regret": 0.35110077261924744, "entropy": 0.08022776246070862, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:38.199421Z", "loop": 2951, "env_steps": 1813708799, "loss": 0.003297040006145835, "avg_return": 0.4554923474788666, "regret": 0.35110077261924744, "entropy": 0.0840940922498703, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:39.361853Z", "loop": 2952, "env_steps": 1814323199, "loss": 0.003101702779531479, "avg_return": 0.45204102993011475, "regret": 0.35110077261924744, "entropy": 0.0838802382349968, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:40.523132Z", "loop": 2953, "env_steps": 1814937599, "loss": 0.0029923166148364544, "avg_return": 0.44955164194107056, "regret": 0.35110077261924744, "entropy": 0.08079702407121658, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:41.684471Z", "loop": 2954, "env_steps": 1815551999, "loss": 0.0027856265660375357, "avg_return": 0.45300284028053284, "regret": 0.35110077261924744, "entropy": 0.07182794064283371, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:42.846822Z", "loop": 2955, "env_steps": 1816166399, "loss": 0.002277877414599061, "avg_return": 0.4545421600341797, "regret": 0.35110077261924744, "entropy": 0.06371871381998062, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:44.007465Z", "loop": 2956, "env_steps": 1816780799, "loss": 0.0022463572677224874, "avg_return": 0.4540626108646393, "regret": 0.35110077261924744, "entropy": 0.06155679002404213, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:45.169457Z", "loop": 2957, "env_steps": 1817395199, "loss": 0.0020211879163980484, "avg_return": 0.45334845781326294, "regret": 0.35110077261924744, "entropy": 0.0612485446035862, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:46.329989Z", "loop": 2958, "env_steps": 1818009599, "loss": 0.0021769441664218903, "avg_return": 0.44956398010253906, "regret": 0.35110077261924744, "entropy": 0.0603264756500721, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:47.491111Z", "loop": 2959, "env_steps": 1818623999, "loss": 0.0017344144871458411, "avg_return": 0.4509061872959137, "regret": 0.35110077261924744, "entropy": 0.05845123901963234, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:48.696618Z", "loop": 2960, "env_steps": 1819238399, "loss": 0.0017184989992529154, "avg_return": 0.4504580795764923, "regret": 0.3513897955417633, "entropy": 0.05746699869632721, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:49.859273Z", "loop": 2961, "env_steps": 1819852799, "loss": 0.0016716236714273691, "avg_return": 0.4510078430175781, "regret": 0.3513897955417633, "entropy": 0.05775480717420578, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:51.019430Z", "loop": 2962, "env_steps": 1820467199, "loss": 0.0015594344586133957, "avg_return": 0.4552099108695984, "regret": 0.3513897955417633, "entropy": 0.0544365756213665, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:52.180387Z", "loop": 2963, "env_steps": 1821081599, "loss": 0.0016032559797167778, "avg_return": 0.4562947750091553, "regret": 0.3513897955417633, "entropy": 0.057064592838287354, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:53.341815Z", "loop": 2964, "env_steps": 1821695999, "loss": 0.001642028451897204, "avg_return": 0.45118948817253113, "regret": 0.3513897955417633, "entropy": 0.05622867867350578, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:54.502457Z", "loop": 2965, "env_steps": 1822310399, "loss": 0.0017910925671458244, "avg_return": 0.4531175196170807, "regret": 0.3513897955417633, "entropy": 0.06079104170203209, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:55.666756Z", "loop": 2966, "env_steps": 1822924799, "loss": 0.0018574355635792017, "avg_return": 0.4508197009563446, "regret": 0.3513897955417633, "entropy": 0.06093937158584595, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:56.826912Z", "loop": 2967, "env_steps": 1823539199, "loss": 0.001960343448445201, "avg_return": 0.4482370615005493, "regret": 0.3513897955417633, "entropy": 0.062383782118558884, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:57.987180Z", "loop": 2968, "env_steps": 1824153599, "loss": 0.0021246394608169794, "avg_return": 0.45840078592300415, "regret": 0.3513897955417633, "entropy": 0.06356601417064667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:23:59.149119Z", "loop": 2969, "env_steps": 1824767999, "loss": 0.0022658787202090025, "avg_return": 0.4470694661140442, "regret": 0.3513897955417633, "entropy": 0.061913978308439255, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:00.358896Z", "loop": 2970, "env_steps": 1825382399, "loss": 0.001776580698788166, "avg_return": 0.45336630940437317, "regret": 0.35119184851646423, "entropy": 0.0593230277299881, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:01.521323Z", "loop": 2971, "env_steps": 1825996799, "loss": 0.0016900617629289627, "avg_return": 0.45587921142578125, "regret": 0.35119184851646423, "entropy": 0.05830540880560875, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:02.682655Z", "loop": 2972, "env_steps": 1826611199, "loss": 0.0014682277105748653, "avg_return": 0.4415680170059204, "regret": 0.35119184851646423, "entropy": 0.05880757421255112, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:03.844074Z", "loop": 2973, "env_steps": 1827225599, "loss": 0.0014483658596873283, "avg_return": 0.4598863422870636, "regret": 0.35119184851646423, "entropy": 0.05686911940574646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:05.005174Z", "loop": 2974, "env_steps": 1827839999, "loss": 0.0015048504574224353, "avg_return": 0.45457398891448975, "regret": 0.35119184851646423, "entropy": 0.05648022145032883, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:06.168470Z", "loop": 2975, "env_steps": 1828454399, "loss": 0.0016032581916078925, "avg_return": 0.453888863325119, "regret": 0.35119184851646423, "entropy": 0.05241324007511139, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:07.328816Z", "loop": 2976, "env_steps": 1829068799, "loss": 0.0014161014696583152, "avg_return": 0.4475647211074829, "regret": 0.35119184851646423, "entropy": 0.0561327300965786, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:08.490385Z", "loop": 2977, "env_steps": 1829683199, "loss": 0.001540933852083981, "avg_return": 0.44565725326538086, "regret": 0.35119184851646423, "entropy": 0.05541769787669182, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:09.652694Z", "loop": 2978, "env_steps": 1830297599, "loss": 0.001813650131225586, "avg_return": 0.453904390335083, "regret": 0.35119184851646423, "entropy": 0.059116072952747345, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:10.814188Z", "loop": 2979, "env_steps": 1830911999, "loss": 0.0017825972754508257, "avg_return": 0.44543367624282837, "regret": 0.35119184851646423, "entropy": 0.06120959296822548, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:12.031690Z", "loop": 2980, "env_steps": 1831526399, "loss": 0.002211095066741109, "avg_return": 0.45776596665382385, "regret": 0.35111960768699646, "entropy": 0.06215539947152138, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:13.200141Z", "loop": 2981, "env_steps": 1832140799, "loss": 0.0020950871985405684, "avg_return": 0.4566044211387634, "regret": 0.35111960768699646, "entropy": 0.063201405107975, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:14.360633Z", "loop": 2982, "env_steps": 1832755199, "loss": 0.002395190065726638, "avg_return": 0.4481407403945923, "regret": 0.35111960768699646, "entropy": 0.06633168458938599, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:15.522028Z", "loop": 2983, "env_steps": 1833369599, "loss": 0.0024568436201661825, "avg_return": 0.45457327365875244, "regret": 0.35111960768699646, "entropy": 0.07045713067054749, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:16.682585Z", "loop": 2984, "env_steps": 1833983999, "loss": 0.002483097603544593, "avg_return": 0.4567388594150543, "regret": 0.35111960768699646, "entropy": 0.07178633660078049, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:17.843643Z", "loop": 2985, "env_steps": 1834598399, "loss": 0.002519328612834215, "avg_return": 0.4447158873081207, "regret": 0.35111960768699646, "entropy": 0.07715659588575363, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:19.003640Z", "loop": 2986, "env_steps": 1835212799, "loss": 0.0026445346884429455, "avg_return": 0.4541315734386444, "regret": 0.35111960768699646, "entropy": 0.07802511006593704, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:20.163829Z", "loop": 2987, "env_steps": 1835827199, "loss": 0.002599921775981784, "avg_return": 0.4507862329483032, "regret": 0.35111960768699646, "entropy": 0.08298169076442719, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:21.323073Z", "loop": 2988, "env_steps": 1836441599, "loss": 0.0026105802971869707, "avg_return": 0.4503466486930847, "regret": 0.35111960768699646, "entropy": 0.07771794497966766, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:22.482643Z", "loop": 2989, "env_steps": 1837055999, "loss": 0.0028643307741731405, "avg_return": 0.46075257658958435, "regret": 0.35111960768699646, "entropy": 0.0795619860291481, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:23.688147Z", "loop": 2990, "env_steps": 1837670399, "loss": 0.0027244153898209333, "avg_return": 0.4514506161212921, "regret": 0.3511074483394623, "entropy": 0.08373723924160004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:24.852323Z", "loop": 2991, "env_steps": 1838284799, "loss": 0.002658177400007844, "avg_return": 0.45224860310554504, "regret": 0.3511074483394623, "entropy": 0.08268836885690689, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:26.013807Z", "loop": 2992, "env_steps": 1838899199, "loss": 0.0021095050033181906, "avg_return": 0.4530777633190155, "regret": 0.3511074483394623, "entropy": 0.08015169203281403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:27.174477Z", "loop": 2993, "env_steps": 1839513599, "loss": 0.0016280477866530418, "avg_return": 0.4544978439807892, "regret": 0.3511074483394623, "entropy": 0.08050279319286346, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:28.335787Z", "loop": 2994, "env_steps": 1840127999, "loss": 0.0015984801575541496, "avg_return": 0.45539531111717224, "regret": 0.3511074483394623, "entropy": 0.07676905393600464, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:29.495423Z", "loop": 2995, "env_steps": 1840742399, "loss": 0.0016063572838902473, "avg_return": 0.45196402072906494, "regret": 0.3511074483394623, "entropy": 0.07942496985197067, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:30.656354Z", "loop": 2996, "env_steps": 1841356799, "loss": 0.0010657055536285043, "avg_return": 0.4458952844142914, "regret": 0.3511074483394623, "entropy": 0.08157603442668915, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:31.817129Z", "loop": 2997, "env_steps": 1841971199, "loss": 0.0013570516603067517, "avg_return": 0.4507032334804535, "regret": 0.3511074483394623, "entropy": 0.08018160611391068, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:32.977458Z", "loop": 2998, "env_steps": 1842585599, "loss": 0.0015827510505914688, "avg_return": 0.456182062625885, "regret": 0.3511074483394623, "entropy": 0.08124767243862152, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:34.137246Z", "loop": 2999, "env_steps": 1843199999, "loss": 0.0016839553136378527, "avg_return": 0.45108985900878906, "regret": 0.3511074483394623, "entropy": 0.08232078701257706, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:35.339788Z", "loop": 3000, "env_steps": 1843814399, "loss": 0.0013333514798432589, "avg_return": 0.4473927915096283, "regret": 0.3529910445213318, "entropy": 0.08453943580389023, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:36.500700Z", "loop": 3001, "env_steps": 1844428799, "loss": 0.001307381084188819, "avg_return": 0.4498847424983978, "regret": 0.3529910445213318, "entropy": 0.08489494770765305, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:37.660954Z", "loop": 3002, "env_steps": 1845043199, "loss": 0.0011554057709872723, "avg_return": 0.4428565502166748, "regret": 0.3529910445213318, "entropy": 0.08552063256502151, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:38.820528Z", "loop": 3003, "env_steps": 1845657599, "loss": 0.0011960986303165555, "avg_return": 0.4527931809425354, "regret": 0.3529910445213318, "entropy": 0.081667959690094, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:39.981692Z", "loop": 3004, "env_steps": 1846271999, "loss": 0.0010406248038634658, "avg_return": 0.4489990472793579, "regret": 0.3529910445213318, "entropy": 0.07922118902206421, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:41.143083Z", "loop": 3005, "env_steps": 1846886399, "loss": 0.0009120468166656792, "avg_return": 0.45819541811943054, "regret": 0.3529910445213318, "entropy": 0.07623109221458435, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:42.303727Z", "loop": 3006, "env_steps": 1847500799, "loss": 0.0007880114135332406, "avg_return": 0.44412437081336975, "regret": 0.3529910445213318, "entropy": 0.06895754486322403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:43.464990Z", "loop": 3007, "env_steps": 1848115199, "loss": 0.000647961103823036, "avg_return": 0.45717620849609375, "regret": 0.3529910445213318, "entropy": 0.07297179102897644, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:44.625371Z", "loop": 3008, "env_steps": 1848729599, "loss": 0.0007675024098716676, "avg_return": 0.4546296298503876, "regret": 0.3529910445213318, "entropy": 0.0684259831905365, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:45.785800Z", "loop": 3009, "env_steps": 1849343999, "loss": 0.0009402590803802013, "avg_return": 0.4547038972377777, "regret": 0.3529910445213318, "entropy": 0.06547819823026657, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:46.997412Z", "loop": 3010, "env_steps": 1849958399, "loss": 0.0011040841927751899, "avg_return": 0.45056548714637756, "regret": 0.352972149848938, "entropy": 0.0761607214808464, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:48.165312Z", "loop": 3011, "env_steps": 1850572799, "loss": 0.0012132819974794984, "avg_return": 0.45471400022506714, "regret": 0.352972149848938, "entropy": 0.07277011126279831, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:49.327446Z", "loop": 3012, "env_steps": 1851187199, "loss": 0.0013702254509553313, "avg_return": 0.4509914219379425, "regret": 0.352972149848938, "entropy": 0.07443541288375854, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:50.490404Z", "loop": 3013, "env_steps": 1851801599, "loss": 0.0012904915492981672, "avg_return": 0.44145509600639343, "regret": 0.352972149848938, "entropy": 0.07591745257377625, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:51.652421Z", "loop": 3014, "env_steps": 1852415999, "loss": 0.0014650608645752072, "avg_return": 0.45653286576271057, "regret": 0.352972149848938, "entropy": 0.06976573914289474, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:52.815715Z", "loop": 3015, "env_steps": 1853030399, "loss": 0.0015129041858017445, "avg_return": 0.4520183503627777, "regret": 0.352972149848938, "entropy": 0.06945867091417313, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:53.977487Z", "loop": 3016, "env_steps": 1853644799, "loss": 0.0013629997847601771, "avg_return": 0.4559554159641266, "regret": 0.352972149848938, "entropy": 0.07387187331914902, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:55.140086Z", "loop": 3017, "env_steps": 1854259199, "loss": 0.0012957712169736624, "avg_return": 0.4585091769695282, "regret": 0.352972149848938, "entropy": 0.06849925220012665, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:56.305031Z", "loop": 3018, "env_steps": 1854873599, "loss": 0.0012774837668985128, "avg_return": 0.4484233856201172, "regret": 0.352972149848938, "entropy": 0.07077532261610031, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:57.467106Z", "loop": 3019, "env_steps": 1855487999, "loss": 0.0014914635103195906, "avg_return": 0.4534478783607483, "regret": 0.352972149848938, "entropy": 0.0704190731048584, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:58.681001Z", "loop": 3020, "env_steps": 1856102399, "loss": 0.0014268714003264904, "avg_return": 0.448849081993103, "regret": 0.35198983550071716, "entropy": 0.07066631317138672, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:24:59.842295Z", "loop": 3021, "env_steps": 1856716799, "loss": 0.0014398768544197083, "avg_return": 0.4538390636444092, "regret": 0.35198983550071716, "entropy": 0.07032706588506699, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:01.004161Z", "loop": 3022, "env_steps": 1857331199, "loss": 0.0013053336879238486, "avg_return": 0.4532323181629181, "regret": 0.35198983550071716, "entropy": 0.07222449034452438, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:02.165251Z", "loop": 3023, "env_steps": 1857945599, "loss": 0.0012643050868064165, "avg_return": 0.46156683564186096, "regret": 0.35198983550071716, "entropy": 0.07298066467046738, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:03.327317Z", "loop": 3024, "env_steps": 1858559999, "loss": 0.0010307102929800749, "avg_return": 0.4525398313999176, "regret": 0.35198983550071716, "entropy": 0.07396656274795532, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:04.487476Z", "loop": 3025, "env_steps": 1859174399, "loss": 0.0011906985891982913, "avg_return": 0.4623064398765564, "regret": 0.35198983550071716, "entropy": 0.07339838147163391, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:05.648007Z", "loop": 3026, "env_steps": 1859788799, "loss": 0.001065633143298328, "avg_return": 0.45775142312049866, "regret": 0.35198983550071716, "entropy": 0.07901636511087418, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:06.809658Z", "loop": 3027, "env_steps": 1860403199, "loss": 0.0009324480779469013, "avg_return": 0.4571332335472107, "regret": 0.35198983550071716, "entropy": 0.07692674547433853, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:07.969904Z", "loop": 3028, "env_steps": 1861017599, "loss": 0.0010777569841593504, "avg_return": 0.4512384235858917, "regret": 0.35198983550071716, "entropy": 0.07610466331243515, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:09.132608Z", "loop": 3029, "env_steps": 1861631999, "loss": 0.001061189454048872, "avg_return": 0.4506373107433319, "regret": 0.35198983550071716, "entropy": 0.08140775561332703, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:10.337961Z", "loop": 3030, "env_steps": 1862246399, "loss": 0.0010043449001386762, "avg_return": 0.4603835642337799, "regret": 0.35071849822998047, "entropy": 0.07489477843046188, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:11.499712Z", "loop": 3031, "env_steps": 1862860799, "loss": 0.0009757971274666488, "avg_return": 0.45333221554756165, "regret": 0.35071849822998047, "entropy": 0.07519668340682983, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:12.660228Z", "loop": 3032, "env_steps": 1863475199, "loss": 0.0010376967256888747, "avg_return": 0.45208486914634705, "regret": 0.35071849822998047, "entropy": 0.07896462827920914, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:13.821369Z", "loop": 3033, "env_steps": 1864089599, "loss": 0.001120847649872303, "avg_return": 0.457027792930603, "regret": 0.35071849822998047, "entropy": 0.07530737668275833, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:14.980914Z", "loop": 3034, "env_steps": 1864703999, "loss": 0.0012165697989985347, "avg_return": 0.44827720522880554, "regret": 0.35071849822998047, "entropy": 0.08152617514133453, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:16.141933Z", "loop": 3035, "env_steps": 1865318399, "loss": 0.0010744563769549131, "avg_return": 0.45526906847953796, "regret": 0.35071849822998047, "entropy": 0.07836005091667175, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:17.302716Z", "loop": 3036, "env_steps": 1865932799, "loss": 0.0012839878909289837, "avg_return": 0.45275336503982544, "regret": 0.35071849822998047, "entropy": 0.08010486513376236, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:18.462830Z", "loop": 3037, "env_steps": 1866547199, "loss": 0.0012794245267286897, "avg_return": 0.4492853283882141, "regret": 0.35071849822998047, "entropy": 0.08805138617753983, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:19.623984Z", "loop": 3038, "env_steps": 1867161599, "loss": 0.0014069200260564685, "avg_return": 0.44756004214286804, "regret": 0.35071849822998047, "entropy": 0.09235245734453201, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:20.784651Z", "loop": 3039, "env_steps": 1867775999, "loss": 0.00163117831107229, "avg_return": 0.4492524266242981, "regret": 0.35071849822998047, "entropy": 0.08519035577774048, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:21.990181Z", "loop": 3040, "env_steps": 1868390399, "loss": 0.0016026431694626808, "avg_return": 0.4473447799682617, "regret": 0.3506644070148468, "entropy": 0.08762083202600479, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:23.151128Z", "loop": 3041, "env_steps": 1869004799, "loss": 0.001619274728000164, "avg_return": 0.46362200379371643, "regret": 0.3506644070148468, "entropy": 0.08973190188407898, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:24.312781Z", "loop": 3042, "env_steps": 1869619199, "loss": 0.001539183547720313, "avg_return": 0.45123881101608276, "regret": 0.3506644070148468, "entropy": 0.09138047695159912, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:25.476228Z", "loop": 3043, "env_steps": 1870233599, "loss": 0.001769659691490233, "avg_return": 0.44583407044410706, "regret": 0.3506644070148468, "entropy": 0.09828345477581024, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:26.637917Z", "loop": 3044, "env_steps": 1870847999, "loss": 0.0017614354146644473, "avg_return": 0.45784303545951843, "regret": 0.3506644070148468, "entropy": 0.09553276747465134, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:27.798639Z", "loop": 3045, "env_steps": 1871462399, "loss": 0.0016445362707599998, "avg_return": 0.45628073811531067, "regret": 0.3506644070148468, "entropy": 0.08800681680440903, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:28.959292Z", "loop": 3046, "env_steps": 1872076799, "loss": 0.002037155209109187, "avg_return": 0.4571210443973541, "regret": 0.3506644070148468, "entropy": 0.09443666785955429, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:30.121785Z", "loop": 3047, "env_steps": 1872691199, "loss": 0.0018024108139798045, "avg_return": 0.4558386206626892, "regret": 0.3506644070148468, "entropy": 0.09684807062149048, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:31.282832Z", "loop": 3048, "env_steps": 1873305599, "loss": 0.0019810989033430815, "avg_return": 0.4523308277130127, "regret": 0.3506644070148468, "entropy": 0.09801235795021057, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:32.444160Z", "loop": 3049, "env_steps": 1873919999, "loss": 0.0019972508307546377, "avg_return": 0.4575905501842499, "regret": 0.3506644070148468, "entropy": 0.09791523963212967, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:33.653707Z", "loop": 3050, "env_steps": 1874534399, "loss": 0.001977801090106368, "avg_return": 0.4574706554412842, "regret": 0.3506658375263214, "entropy": 0.09480778127908707, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:34.816006Z", "loop": 3051, "env_steps": 1875148799, "loss": 0.0022241617552936077, "avg_return": 0.4622167944908142, "regret": 0.3506658375263214, "entropy": 0.09121538698673248, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:35.976935Z", "loop": 3052, "env_steps": 1875763199, "loss": 0.002003834582865238, "avg_return": 0.4579857885837555, "regret": 0.3506658375263214, "entropy": 0.09038763493299484, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:37.137821Z", "loop": 3053, "env_steps": 1876377599, "loss": 0.0017338077304884791, "avg_return": 0.45430493354797363, "regret": 0.3506658375263214, "entropy": 0.09071735292673111, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:38.298840Z", "loop": 3054, "env_steps": 1876991999, "loss": 0.0015688164858147502, "avg_return": 0.45759904384613037, "regret": 0.3506658375263214, "entropy": 0.08879874646663666, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:39.458775Z", "loop": 3055, "env_steps": 1877606399, "loss": 0.0014855754561722279, "avg_return": 0.4457692503929138, "regret": 0.3506658375263214, "entropy": 0.09097003191709518, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:40.620409Z", "loop": 3056, "env_steps": 1878220799, "loss": 0.0012684426037594676, "avg_return": 0.4566977918148041, "regret": 0.3506658375263214, "entropy": 0.08874672651290894, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:41.780559Z", "loop": 3057, "env_steps": 1878835199, "loss": 0.0014453618787229061, "avg_return": 0.4539576470851898, "regret": 0.3506658375263214, "entropy": 0.07788512110710144, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:42.941275Z", "loop": 3058, "env_steps": 1879449599, "loss": 0.0013022840721532702, "avg_return": 0.4486487805843353, "regret": 0.3506658375263214, "entropy": 0.07858309894800186, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:44.101268Z", "loop": 3059, "env_steps": 1880063999, "loss": 0.0011836118064820766, "avg_return": 0.4546295404434204, "regret": 0.3506658375263214, "entropy": 0.0831616073846817, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:45.308612Z", "loop": 3060, "env_steps": 1880678399, "loss": 0.0013363288016989827, "avg_return": 0.4592234492301941, "regret": 0.3506172001361847, "entropy": 0.09034337848424911, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:46.470944Z", "loop": 3061, "env_steps": 1881292799, "loss": 0.001350381295196712, "avg_return": 0.45695963501930237, "regret": 0.3506172001361847, "entropy": 0.08442771434783936, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:47.632679Z", "loop": 3062, "env_steps": 1881907199, "loss": 0.0014426216948777437, "avg_return": 0.45363521575927734, "regret": 0.3506172001361847, "entropy": 0.08367554843425751, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:48.795000Z", "loop": 3063, "env_steps": 1882521599, "loss": 0.0014316103188320994, "avg_return": 0.45384451746940613, "regret": 0.3506172001361847, "entropy": 0.08471304923295975, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:49.956751Z", "loop": 3064, "env_steps": 1883135999, "loss": 0.0016926017124205828, "avg_return": 0.464470773935318, "regret": 0.3506172001361847, "entropy": 0.08104929327964783, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:51.119032Z", "loop": 3065, "env_steps": 1883750399, "loss": 0.0014408057322725654, "avg_return": 0.46098455786705017, "regret": 0.3506172001361847, "entropy": 0.08370675146579742, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:52.280299Z", "loop": 3066, "env_steps": 1884364799, "loss": 0.0014948428142815828, "avg_return": 0.4512383043766022, "regret": 0.3506172001361847, "entropy": 0.0858725756406784, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:53.441777Z", "loop": 3067, "env_steps": 1884979199, "loss": 0.0013609844027087092, "avg_return": 0.4518558382987976, "regret": 0.3506172001361847, "entropy": 0.0871191993355751, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:54.603275Z", "loop": 3068, "env_steps": 1885593599, "loss": 0.0013688275357708335, "avg_return": 0.4536985456943512, "regret": 0.3506172001361847, "entropy": 0.0908210501074791, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:55.764201Z", "loop": 3069, "env_steps": 1886207999, "loss": 0.0013635781360790133, "avg_return": 0.4548434615135193, "regret": 0.3506172001361847, "entropy": 0.08718788623809814, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:56.971410Z", "loop": 3070, "env_steps": 1886822399, "loss": 0.0012751598842442036, "avg_return": 0.45823049545288086, "regret": 0.3506157100200653, "entropy": 0.08695633709430695, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:58.132215Z", "loop": 3071, "env_steps": 1887436799, "loss": 0.0011731943814083934, "avg_return": 0.4514409601688385, "regret": 0.3506157100200653, "entropy": 0.07722607254981995, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:25:59.294214Z", "loop": 3072, "env_steps": 1888051199, "loss": 0.0011814044555649161, "avg_return": 0.4503316283226013, "regret": 0.3506157100200653, "entropy": 0.0837915912270546, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:00.455344Z", "loop": 3073, "env_steps": 1888665599, "loss": 0.0009487057104706764, "avg_return": 0.4474276900291443, "regret": 0.3506157100200653, "entropy": 0.07697861641645432, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:01.617622Z", "loop": 3074, "env_steps": 1889279999, "loss": 0.000996603979729116, "avg_return": 0.45622366666793823, "regret": 0.3506157100200653, "entropy": 0.07358703762292862, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:02.777982Z", "loop": 3075, "env_steps": 1889894399, "loss": 0.0009071724489331245, "avg_return": 0.45132026076316833, "regret": 0.3506157100200653, "entropy": 0.07253243029117584, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:03.939816Z", "loop": 3076, "env_steps": 1890508799, "loss": 0.0009139985777437687, "avg_return": 0.4511674642562866, "regret": 0.3506157100200653, "entropy": 0.07675283402204514, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:05.101317Z", "loop": 3077, "env_steps": 1891123199, "loss": 0.001009979983791709, "avg_return": 0.4553576409816742, "regret": 0.3506157100200653, "entropy": 0.0718739703297615, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:06.261920Z", "loop": 3078, "env_steps": 1891737599, "loss": 0.0010394257260486484, "avg_return": 0.4579142928123474, "regret": 0.3506157100200653, "entropy": 0.07547475397586823, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:07.424220Z", "loop": 3079, "env_steps": 1892351999, "loss": 0.0011257387232035398, "avg_return": 0.44626379013061523, "regret": 0.3506157100200653, "entropy": 0.07299143821001053, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:08.632281Z", "loop": 3080, "env_steps": 1892966399, "loss": 0.0010807303478941321, "avg_return": 0.44970235228538513, "regret": 0.3512929379940033, "entropy": 0.07229814678430557, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:09.793987Z", "loop": 3081, "env_steps": 1893580799, "loss": 0.0011853225296363235, "avg_return": 0.4553494453430176, "regret": 0.3512929379940033, "entropy": 0.07364960014820099, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:10.953971Z", "loop": 3082, "env_steps": 1894195199, "loss": 0.0014919358072802424, "avg_return": 0.4421093463897705, "regret": 0.3512929379940033, "entropy": 0.07467809319496155, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:12.115002Z", "loop": 3083, "env_steps": 1894809599, "loss": 0.0018523874459788203, "avg_return": 0.44998252391815186, "regret": 0.3512929379940033, "entropy": 0.07541826367378235, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:13.275223Z", "loop": 3084, "env_steps": 1895423999, "loss": 0.00207940093241632, "avg_return": 0.4521576166152954, "regret": 0.3512929379940033, "entropy": 0.08124073594808578, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:14.435373Z", "loop": 3085, "env_steps": 1896038399, "loss": 0.002531682373955846, "avg_return": 0.45010310411453247, "regret": 0.3512929379940033, "entropy": 0.09072219580411911, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:15.596749Z", "loop": 3086, "env_steps": 1896652799, "loss": 0.0023434029426425695, "avg_return": 0.44818350672721863, "regret": 0.3512929379940033, "entropy": 0.08645813912153244, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:16.757110Z", "loop": 3087, "env_steps": 1897267199, "loss": 0.002466475125402212, "avg_return": 0.4521978795528412, "regret": 0.3512929379940033, "entropy": 0.08385185897350311, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:17.918381Z", "loop": 3088, "env_steps": 1897881599, "loss": 0.00217147427611053, "avg_return": 0.44848063588142395, "regret": 0.3512929379940033, "entropy": 0.0844782218337059, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:19.077790Z", "loop": 3089, "env_steps": 1898495999, "loss": 0.002213447354733944, "avg_return": 0.450128436088562, "regret": 0.3512929379940033, "entropy": 0.08023142069578171, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:20.283701Z", "loop": 3090, "env_steps": 1899110399, "loss": 0.0018735064659267664, "avg_return": 0.44348907470703125, "regret": 0.3547985553741455, "entropy": 0.07827703654766083, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:21.445119Z", "loop": 3091, "env_steps": 1899724799, "loss": 0.0023312473203986883, "avg_return": 0.4563148617744446, "regret": 0.3547985553741455, "entropy": 0.07821580767631531, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:22.607499Z", "loop": 3092, "env_steps": 1900339199, "loss": 0.0024032024666666985, "avg_return": 0.4542170464992523, "regret": 0.3547985553741455, "entropy": 0.08555884659290314, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:23.768634Z", "loop": 3093, "env_steps": 1900953599, "loss": 0.0023175745736807585, "avg_return": 0.4502122104167938, "regret": 0.3547985553741455, "entropy": 0.08759785443544388, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:24.929697Z", "loop": 3094, "env_steps": 1901567999, "loss": 0.0023222228046506643, "avg_return": 0.4511277377605438, "regret": 0.3547985553741455, "entropy": 0.08724328875541687, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:26.089591Z", "loop": 3095, "env_steps": 1902182399, "loss": 0.0027098297141492367, "avg_return": 0.45706361532211304, "regret": 0.3547985553741455, "entropy": 0.09043017029762268, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:27.250172Z", "loop": 3096, "env_steps": 1902796799, "loss": 0.002416257979348302, "avg_return": 0.44941312074661255, "regret": 0.3547985553741455, "entropy": 0.09420568495988846, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:28.411860Z", "loop": 3097, "env_steps": 1903411199, "loss": 0.002431532833725214, "avg_return": 0.4478216767311096, "regret": 0.3547985553741455, "entropy": 0.09126016497612, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:29.572210Z", "loop": 3098, "env_steps": 1904025599, "loss": 0.0025792093947529793, "avg_return": 0.455063134431839, "regret": 0.3547985553741455, "entropy": 0.09098606556653976, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:30.733239Z", "loop": 3099, "env_steps": 1904639999, "loss": 0.0024691747967153788, "avg_return": 0.4546584188938141, "regret": 0.3547985553741455, "entropy": 0.09040577709674835, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:31.938370Z", "loop": 3100, "env_steps": 1905254399, "loss": 0.0023716548457741737, "avg_return": 0.45248979330062866, "regret": 0.35173070430755615, "entropy": 0.09423062205314636, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:33.101267Z", "loop": 3101, "env_steps": 1905868799, "loss": 0.0024121140595525503, "avg_return": 0.44663289189338684, "regret": 0.35173070430755615, "entropy": 0.09877666085958481, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:34.264343Z", "loop": 3102, "env_steps": 1906483199, "loss": 0.0025362945161759853, "avg_return": 0.4499951899051666, "regret": 0.35173070430755615, "entropy": 0.08949057757854462, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:35.425921Z", "loop": 3103, "env_steps": 1907097599, "loss": 0.0026474171318113804, "avg_return": 0.45051977038383484, "regret": 0.35173070430755615, "entropy": 0.09631241112947464, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:36.586165Z", "loop": 3104, "env_steps": 1907711999, "loss": 0.002537485910579562, "avg_return": 0.45285940170288086, "regret": 0.35173070430755615, "entropy": 0.09814643859863281, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:37.748432Z", "loop": 3105, "env_steps": 1908326399, "loss": 0.002328908536583185, "avg_return": 0.456670343875885, "regret": 0.35173070430755615, "entropy": 0.08831022679805756, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:38.911291Z", "loop": 3106, "env_steps": 1908940799, "loss": 0.0015619267942383885, "avg_return": 0.4385710656642914, "regret": 0.35173070430755615, "entropy": 0.07354561239480972, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:40.071336Z", "loop": 3107, "env_steps": 1909555199, "loss": 0.001213599694892764, "avg_return": 0.45192667841911316, "regret": 0.35173070430755615, "entropy": 0.07357772439718246, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:41.232746Z", "loop": 3108, "env_steps": 1910169599, "loss": 0.0009268368594348431, "avg_return": 0.4456537067890167, "regret": 0.35173070430755615, "entropy": 0.06520646810531616, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:42.392940Z", "loop": 3109, "env_steps": 1910783999, "loss": 0.0008161989971995354, "avg_return": 0.45050501823425293, "regret": 0.35173070430755615, "entropy": 0.06735822558403015, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:43.604688Z", "loop": 3110, "env_steps": 1911398399, "loss": 0.0009554963908158243, "avg_return": 0.4499433636665344, "regret": 0.3554147779941559, "entropy": 0.06173441559076309, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:44.766971Z", "loop": 3111, "env_steps": 1912012799, "loss": 0.0010431719711050391, "avg_return": 0.45450833439826965, "regret": 0.3554147779941559, "entropy": 0.06382200866937637, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:45.927987Z", "loop": 3112, "env_steps": 1912627199, "loss": 0.0010130176087841392, "avg_return": 0.4412270784378052, "regret": 0.3554147779941559, "entropy": 0.06751339137554169, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:47.089854Z", "loop": 3113, "env_steps": 1913241599, "loss": 0.0010990897426381707, "avg_return": 0.452146053314209, "regret": 0.3554147779941559, "entropy": 0.06742360442876816, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:48.251462Z", "loop": 3114, "env_steps": 1913855999, "loss": 0.0011565869208425283, "avg_return": 0.44401684403419495, "regret": 0.3554147779941559, "entropy": 0.06988400220870972, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:49.413863Z", "loop": 3115, "env_steps": 1914470399, "loss": 0.001110799377784133, "avg_return": 0.44066762924194336, "regret": 0.3554147779941559, "entropy": 0.06986663490533829, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:50.574261Z", "loop": 3116, "env_steps": 1915084799, "loss": 0.0009907514322549105, "avg_return": 0.4509815573692322, "regret": 0.3554147779941559, "entropy": 0.06883863359689713, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:51.735117Z", "loop": 3117, "env_steps": 1915699199, "loss": 0.0009033373789861798, "avg_return": 0.4505312740802765, "regret": 0.3554147779941559, "entropy": 0.06550750881433487, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:52.901362Z", "loop": 3118, "env_steps": 1916313599, "loss": 0.0010004647774621844, "avg_return": 0.447457492351532, "regret": 0.3554147779941559, "entropy": 0.06402687728404999, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:54.061911Z", "loop": 3119, "env_steps": 1916927999, "loss": 0.0010165824787691236, "avg_return": 0.44530412554740906, "regret": 0.3554147779941559, "entropy": 0.06841666251420975, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:55.274515Z", "loop": 3120, "env_steps": 1917542399, "loss": 0.0011675558052957058, "avg_return": 0.4506910443305969, "regret": 0.3525818884372711, "entropy": 0.07032880932092667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:56.436610Z", "loop": 3121, "env_steps": 1918156799, "loss": 0.0017215913394466043, "avg_return": 0.4496169090270996, "regret": 0.3525818884372711, "entropy": 0.07556848973035812, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:57.597667Z", "loop": 3122, "env_steps": 1918771199, "loss": 0.002182570518925786, "avg_return": 0.44736284017562866, "regret": 0.3525818884372711, "entropy": 0.0996253564953804, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:58.757128Z", "loop": 3123, "env_steps": 1919385599, "loss": 0.002480890369042754, "avg_return": 0.4504722058773041, "regret": 0.3525818884372711, "entropy": 0.10616668313741684, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:26:59.918313Z", "loop": 3124, "env_steps": 1919999999, "loss": 0.0029116494115442038, "avg_return": 0.44860291481018066, "regret": 0.3525818884372711, "entropy": 0.1110556349158287, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:01.079218Z", "loop": 3125, "env_steps": 1920614399, "loss": 0.0027128071524202824, "avg_return": 0.4512184262275696, "regret": 0.3525818884372711, "entropy": 0.1033899337053299, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:02.239371Z", "loop": 3126, "env_steps": 1921228799, "loss": 0.0027631816919893026, "avg_return": 0.450913667678833, "regret": 0.3525818884372711, "entropy": 0.10471231490373611, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:03.400492Z", "loop": 3127, "env_steps": 1921843199, "loss": 0.002478368114680052, "avg_return": 0.450338751077652, "regret": 0.3525818884372711, "entropy": 0.09847736358642578, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:04.561537Z", "loop": 3128, "env_steps": 1922457599, "loss": 0.0020889288280159235, "avg_return": 0.45526590943336487, "regret": 0.3525818884372711, "entropy": 0.0995430201292038, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:05.725669Z", "loop": 3129, "env_steps": 1923071999, "loss": 0.0019244039431214333, "avg_return": 0.4520016610622406, "regret": 0.3525818884372711, "entropy": 0.09125819802284241, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:06.931714Z", "loop": 3130, "env_steps": 1923686399, "loss": 0.0015323148109018803, "avg_return": 0.4593155086040497, "regret": 0.3508383333683014, "entropy": 0.0833500400185585, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:08.093101Z", "loop": 3131, "env_steps": 1924300799, "loss": 0.001425755093805492, "avg_return": 0.45760083198547363, "regret": 0.3508383333683014, "entropy": 0.0862676352262497, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:09.254267Z", "loop": 3132, "env_steps": 1924915199, "loss": 0.0010268635815009475, "avg_return": 0.4536077380180359, "regret": 0.3508383333683014, "entropy": 0.08251643925905228, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:10.417268Z", "loop": 3133, "env_steps": 1925529599, "loss": 0.0007239932892844081, "avg_return": 0.45423176884651184, "regret": 0.3508383333683014, "entropy": 0.0815911665558815, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:11.578869Z", "loop": 3134, "env_steps": 1926143999, "loss": 0.000726790982298553, "avg_return": 0.4558098316192627, "regret": 0.3508383333683014, "entropy": 0.07713314890861511, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:12.739400Z", "loop": 3135, "env_steps": 1926758399, "loss": 0.0010046305833384395, "avg_return": 0.45073801279067993, "regret": 0.3508383333683014, "entropy": 0.07305385172367096, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:13.900845Z", "loop": 3136, "env_steps": 1927372799, "loss": 0.0011486040893942118, "avg_return": 0.45489931106567383, "regret": 0.3508383333683014, "entropy": 0.07270070910453796, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:15.061890Z", "loop": 3137, "env_steps": 1927987199, "loss": 0.0014050162862986326, "avg_return": 0.4533543586730957, "regret": 0.3508383333683014, "entropy": 0.08147256821393967, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:16.224478Z", "loop": 3138, "env_steps": 1928601599, "loss": 0.0016649879980832338, "avg_return": 0.4577140510082245, "regret": 0.3508383333683014, "entropy": 0.08273039013147354, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:17.385988Z", "loop": 3139, "env_steps": 1929215999, "loss": 0.0012904790928587317, "avg_return": 0.4577704071998596, "regret": 0.3508383333683014, "entropy": 0.0721743181347847, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:18.594930Z", "loop": 3140, "env_steps": 1929830399, "loss": 0.0013017882592976093, "avg_return": 0.44582849740982056, "regret": 0.35079050064086914, "entropy": 0.07590927928686142, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:19.757517Z", "loop": 3141, "env_steps": 1930444799, "loss": 0.0015650785062462091, "avg_return": 0.45081812143325806, "regret": 0.35079050064086914, "entropy": 0.07093562185764313, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:20.919244Z", "loop": 3142, "env_steps": 1931059199, "loss": 0.0016788954380899668, "avg_return": 0.4567315876483917, "regret": 0.35079050064086914, "entropy": 0.0700182393193245, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:22.081264Z", "loop": 3143, "env_steps": 1931673599, "loss": 0.0020241818856447935, "avg_return": 0.4573804438114166, "regret": 0.35079050064086914, "entropy": 0.07493014633655548, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:23.242423Z", "loop": 3144, "env_steps": 1932287999, "loss": 0.001777907833456993, "avg_return": 0.45100149512290955, "regret": 0.35079050064086914, "entropy": 0.07685118913650513, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:24.404497Z", "loop": 3145, "env_steps": 1932902399, "loss": 0.001740536536090076, "avg_return": 0.45644399523735046, "regret": 0.35079050064086914, "entropy": 0.07173403352499008, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:25.565427Z", "loop": 3146, "env_steps": 1933516799, "loss": 0.0017259049927815795, "avg_return": 0.45465272665023804, "regret": 0.35079050064086914, "entropy": 0.07553460448980331, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:26.726207Z", "loop": 3147, "env_steps": 1934131199, "loss": 0.001665417687036097, "avg_return": 0.4479304552078247, "regret": 0.35079050064086914, "entropy": 0.06775430589914322, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:27.888058Z", "loop": 3148, "env_steps": 1934745599, "loss": 0.001452851458452642, "avg_return": 0.452953964471817, "regret": 0.35079050064086914, "entropy": 0.06733613461256027, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:29.048376Z", "loop": 3149, "env_steps": 1935359999, "loss": 0.001172335585579276, "avg_return": 0.4581504464149475, "regret": 0.35079050064086914, "entropy": 0.07283436506986618, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:30.255406Z", "loop": 3150, "env_steps": 1935974399, "loss": 0.0011185408802703023, "avg_return": 0.45125943422317505, "regret": 0.3507697284221649, "entropy": 0.07047203183174133, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:31.416668Z", "loop": 3151, "env_steps": 1936588799, "loss": 0.001014215755276382, "avg_return": 0.454169362783432, "regret": 0.3507697284221649, "entropy": 0.07033280283212662, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:32.578934Z", "loop": 3152, "env_steps": 1937203199, "loss": 0.0010721671860665083, "avg_return": 0.44805634021759033, "regret": 0.3507697284221649, "entropy": 0.06759734451770782, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:33.740626Z", "loop": 3153, "env_steps": 1937817599, "loss": 0.0011166486656293273, "avg_return": 0.4477831721305847, "regret": 0.3507697284221649, "entropy": 0.06791014969348907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:34.902979Z", "loop": 3154, "env_steps": 1938431999, "loss": 0.0011115953093394637, "avg_return": 0.454633891582489, "regret": 0.3507697284221649, "entropy": 0.06559175997972488, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:36.063678Z", "loop": 3155, "env_steps": 1939046399, "loss": 0.0009311485337093472, "avg_return": 0.45459675788879395, "regret": 0.3507697284221649, "entropy": 0.06711918115615845, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:37.225316Z", "loop": 3156, "env_steps": 1939660799, "loss": 0.0013631837209686637, "avg_return": 0.4553907513618469, "regret": 0.3507697284221649, "entropy": 0.06956978142261505, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:38.387275Z", "loop": 3157, "env_steps": 1940275199, "loss": 0.001024510944262147, "avg_return": 0.45004990696907043, "regret": 0.3507697284221649, "entropy": 0.07533811032772064, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:39.548050Z", "loop": 3158, "env_steps": 1940889599, "loss": 0.0010056825121864676, "avg_return": 0.45243123173713684, "regret": 0.3507697284221649, "entropy": 0.06526835262775421, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:40.710745Z", "loop": 3159, "env_steps": 1941503999, "loss": 0.0011526909656822681, "avg_return": 0.45485901832580566, "regret": 0.3507697284221649, "entropy": 0.07060348242521286, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:41.922303Z", "loop": 3160, "env_steps": 1942118399, "loss": 0.0012054219841957092, "avg_return": 0.4461633861064911, "regret": 0.3506748080253601, "entropy": 0.06575552374124527, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:43.083962Z", "loop": 3161, "env_steps": 1942732799, "loss": 0.0011003807885572314, "avg_return": 0.4501180052757263, "regret": 0.3506748080253601, "entropy": 0.0712408497929573, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:44.244672Z", "loop": 3162, "env_steps": 1943347199, "loss": 0.001106088049709797, "avg_return": 0.45647355914115906, "regret": 0.3506748080253601, "entropy": 0.06623580306768417, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:45.406508Z", "loop": 3163, "env_steps": 1943961599, "loss": 0.001280442695133388, "avg_return": 0.45582595467567444, "regret": 0.3506748080253601, "entropy": 0.07134959846735, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:46.568900Z", "loop": 3164, "env_steps": 1944575999, "loss": 0.0012261649826541543, "avg_return": 0.46199241280555725, "regret": 0.3506748080253601, "entropy": 0.06863455474376678, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:47.730475Z", "loop": 3165, "env_steps": 1945190399, "loss": 0.0011094019282609224, "avg_return": 0.4442363679409027, "regret": 0.3506748080253601, "entropy": 0.06763551384210587, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:48.892299Z", "loop": 3166, "env_steps": 1945804799, "loss": 0.0011994859669357538, "avg_return": 0.45701858401298523, "regret": 0.3506748080253601, "entropy": 0.06583204865455627, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:50.052496Z", "loop": 3167, "env_steps": 1946419199, "loss": 0.0012357080122455955, "avg_return": 0.4558444321155548, "regret": 0.3506748080253601, "entropy": 0.07092121243476868, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:51.214320Z", "loop": 3168, "env_steps": 1947033599, "loss": 0.0012518572621047497, "avg_return": 0.45337408781051636, "regret": 0.3506748080253601, "entropy": 0.06787238270044327, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:52.378220Z", "loop": 3169, "env_steps": 1947647999, "loss": 0.0010816057911142707, "avg_return": 0.4577732980251312, "regret": 0.3506748080253601, "entropy": 0.0733204036951065, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:53.586171Z", "loop": 3170, "env_steps": 1948262399, "loss": 0.0010858668247237802, "avg_return": 0.4469943940639496, "regret": 0.3506558835506439, "entropy": 0.06795027107000351, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:54.747655Z", "loop": 3171, "env_steps": 1948876799, "loss": 0.001053534564562142, "avg_return": 0.45018982887268066, "regret": 0.3506558835506439, "entropy": 0.06904056668281555, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:55.908557Z", "loop": 3172, "env_steps": 1949491199, "loss": 0.001102365436963737, "avg_return": 0.45710083842277527, "regret": 0.3506558835506439, "entropy": 0.06494057178497314, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:57.071549Z", "loop": 3173, "env_steps": 1950105599, "loss": 0.00135294150095433, "avg_return": 0.4494568407535553, "regret": 0.3506558835506439, "entropy": 0.06688468158245087, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:58.232621Z", "loop": 3174, "env_steps": 1950719999, "loss": 0.0011173792881891131, "avg_return": 0.4587958753108978, "regret": 0.3506558835506439, "entropy": 0.06721536070108414, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:27:59.393506Z", "loop": 3175, "env_steps": 1951334399, "loss": 0.0010209105676040053, "avg_return": 0.44677889347076416, "regret": 0.3506558835506439, "entropy": 0.06603440642356873, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:00.553395Z", "loop": 3176, "env_steps": 1951948799, "loss": 0.0011003251420333982, "avg_return": 0.4563756287097931, "regret": 0.3506558835506439, "entropy": 0.07217729836702347, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:01.714222Z", "loop": 3177, "env_steps": 1952563199, "loss": 0.001070602098479867, "avg_return": 0.45113232731819153, "regret": 0.3506558835506439, "entropy": 0.06860989332199097, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:02.876556Z", "loop": 3178, "env_steps": 1953177599, "loss": 0.0012127466034144163, "avg_return": 0.46032676100730896, "regret": 0.3506558835506439, "entropy": 0.06844988465309143, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:04.037072Z", "loop": 3179, "env_steps": 1953791999, "loss": 0.0013482511276379228, "avg_return": 0.4610094428062439, "regret": 0.3506558835506439, "entropy": 0.07095877081155777, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:05.247078Z", "loop": 3180, "env_steps": 1954406399, "loss": 0.0013941366923972964, "avg_return": 0.45978018641471863, "regret": 0.3507457375526428, "entropy": 0.06968875229358673, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:06.409340Z", "loop": 3181, "env_steps": 1955020799, "loss": 0.0012477361597120762, "avg_return": 0.4512196481227875, "regret": 0.3507457375526428, "entropy": 0.06923021376132965, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:07.571585Z", "loop": 3182, "env_steps": 1955635199, "loss": 0.0010721165454015136, "avg_return": 0.4416793882846832, "regret": 0.3507457375526428, "entropy": 0.06855110079050064, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:08.732566Z", "loop": 3183, "env_steps": 1956249599, "loss": 0.000984152196906507, "avg_return": 0.4555145502090454, "regret": 0.3507457375526428, "entropy": 0.06688663363456726, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:09.894444Z", "loop": 3184, "env_steps": 1956863999, "loss": 0.0009731512400321662, "avg_return": 0.45426708459854126, "regret": 0.3507457375526428, "entropy": 0.06823110580444336, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:11.054995Z", "loop": 3185, "env_steps": 1957478399, "loss": 0.0008326765382662416, "avg_return": 0.45455944538116455, "regret": 0.3507457375526428, "entropy": 0.07127593457698822, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:12.216224Z", "loop": 3186, "env_steps": 1958092799, "loss": 0.0008587349439039826, "avg_return": 0.4549962878227234, "regret": 0.3507457375526428, "entropy": 0.06968962401151657, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:13.379058Z", "loop": 3187, "env_steps": 1958707199, "loss": 0.000729034305550158, "avg_return": 0.4509637951850891, "regret": 0.3507457375526428, "entropy": 0.07144239544868469, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:14.540182Z", "loop": 3188, "env_steps": 1959321599, "loss": 0.00085400854004547, "avg_return": 0.4483271837234497, "regret": 0.3507457375526428, "entropy": 0.07352124899625778, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:15.701689Z", "loop": 3189, "env_steps": 1959935999, "loss": 0.0008111060014925897, "avg_return": 0.4471445381641388, "regret": 0.3507457375526428, "entropy": 0.07385879009962082, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:16.910326Z", "loop": 3190, "env_steps": 1960550399, "loss": 0.0009601671481505036, "avg_return": 0.4561367332935333, "regret": 0.3511379063129425, "entropy": 0.07635768502950668, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:18.072319Z", "loop": 3191, "env_steps": 1961164799, "loss": 0.0010993583127856255, "avg_return": 0.4669637084007263, "regret": 0.3511379063129425, "entropy": 0.07039608061313629, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:19.234103Z", "loop": 3192, "env_steps": 1961779199, "loss": 0.000988118234090507, "avg_return": 0.44270357489585876, "regret": 0.3511379063129425, "entropy": 0.07686478644609451, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:20.394803Z", "loop": 3193, "env_steps": 1962393599, "loss": 0.001071442267857492, "avg_return": 0.45600026845932007, "regret": 0.3511379063129425, "entropy": 0.07507804781198502, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:21.556890Z", "loop": 3194, "env_steps": 1963007999, "loss": 0.0009592600399628282, "avg_return": 0.4510468542575836, "regret": 0.3511379063129425, "entropy": 0.07375121861696243, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:22.717833Z", "loop": 3195, "env_steps": 1963622399, "loss": 0.0010945870308205485, "avg_return": 0.45533648133277893, "regret": 0.3511379063129425, "entropy": 0.07536252588033676, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:23.882576Z", "loop": 3196, "env_steps": 1964236799, "loss": 0.0011389110004529357, "avg_return": 0.45436179637908936, "regret": 0.3511379063129425, "entropy": 0.08034763485193253, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:25.043578Z", "loop": 3197, "env_steps": 1964851199, "loss": 0.0011760444613173604, "avg_return": 0.44071561098098755, "regret": 0.3511379063129425, "entropy": 0.08739633858203888, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:26.204274Z", "loop": 3198, "env_steps": 1965465599, "loss": 0.0012514002155512571, "avg_return": 0.45804229378700256, "regret": 0.3511379063129425, "entropy": 0.07661222666501999, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:27.366433Z", "loop": 3199, "env_steps": 1966079999, "loss": 0.001724426867440343, "avg_return": 0.45836126804351807, "regret": 0.3511379063129425, "entropy": 0.08685249835252762, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:28.577295Z", "loop": 3200, "env_steps": 1966694399, "loss": 0.0020456721540540457, "avg_return": 0.4542715549468994, "regret": 0.35082167387008667, "entropy": 0.08332647383213043, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:29.740347Z", "loop": 3201, "env_steps": 1967308799, "loss": 0.002046958776190877, "avg_return": 0.44866567850112915, "regret": 0.35082167387008667, "entropy": 0.09457970410585403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:30.901553Z", "loop": 3202, "env_steps": 1967923199, "loss": 0.0023687100037932396, "avg_return": 0.4590391516685486, "regret": 0.35082167387008667, "entropy": 0.10007459670305252, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:32.063192Z", "loop": 3203, "env_steps": 1968537599, "loss": 0.0022159290965646505, "avg_return": 0.45976412296295166, "regret": 0.35082167387008667, "entropy": 0.0893537700176239, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:33.223416Z", "loop": 3204, "env_steps": 1969151999, "loss": 0.0018268583808094263, "avg_return": 0.45473629236221313, "regret": 0.35082167387008667, "entropy": 0.08744622021913528, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:34.386228Z", "loop": 3205, "env_steps": 1969766399, "loss": 0.0014273308916017413, "avg_return": 0.4560900032520294, "regret": 0.35082167387008667, "entropy": 0.07810261100530624, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:35.547185Z", "loop": 3206, "env_steps": 1970380799, "loss": 0.0010543278185650706, "avg_return": 0.4521850049495697, "regret": 0.35082167387008667, "entropy": 0.07504065334796906, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:36.708585Z", "loop": 3207, "env_steps": 1970995199, "loss": 0.0009230600553564727, "avg_return": 0.45889559388160706, "regret": 0.35082167387008667, "entropy": 0.07115419954061508, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:37.870675Z", "loop": 3208, "env_steps": 1971609599, "loss": 0.0008997049299068749, "avg_return": 0.44435569643974304, "regret": 0.35082167387008667, "entropy": 0.07368209958076477, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:39.030710Z", "loop": 3209, "env_steps": 1972223999, "loss": 0.0010386309586465359, "avg_return": 0.4531129002571106, "regret": 0.35082167387008667, "entropy": 0.07345209270715714, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:40.240507Z", "loop": 3210, "env_steps": 1972838399, "loss": 0.001138838124461472, "avg_return": 0.4551302194595337, "regret": 0.35066983103752136, "entropy": 0.06883934885263443, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:41.401948Z", "loop": 3211, "env_steps": 1973452799, "loss": 0.0011596882250159979, "avg_return": 0.4404946565628052, "regret": 0.35066983103752136, "entropy": 0.072801873087883, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:42.563347Z", "loop": 3212, "env_steps": 1974067199, "loss": 0.0015076748095452785, "avg_return": 0.45315054059028625, "regret": 0.35066983103752136, "entropy": 0.06904149055480957, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:43.724097Z", "loop": 3213, "env_steps": 1974681599, "loss": 0.0014248255174607038, "avg_return": 0.4529053866863251, "regret": 0.35066983103752136, "entropy": 0.07235000282526016, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:44.885653Z", "loop": 3214, "env_steps": 1975295999, "loss": 0.00129317631945014, "avg_return": 0.451752632856369, "regret": 0.35066983103752136, "entropy": 0.0770396888256073, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:46.047489Z", "loop": 3215, "env_steps": 1975910399, "loss": 0.0011836484773084521, "avg_return": 0.45451682806015015, "regret": 0.35066983103752136, "entropy": 0.07276605069637299, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:47.208722Z", "loop": 3216, "env_steps": 1976524799, "loss": 0.0012978940503671765, "avg_return": 0.4549858570098877, "regret": 0.35066983103752136, "entropy": 0.07142309099435806, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:48.370654Z", "loop": 3217, "env_steps": 1977139199, "loss": 0.0011224310146644711, "avg_return": 0.44863659143447876, "regret": 0.35066983103752136, "entropy": 0.07053062319755554, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:49.530877Z", "loop": 3218, "env_steps": 1977753599, "loss": 0.0010859620524570346, "avg_return": 0.4479714035987854, "regret": 0.35066983103752136, "entropy": 0.07215927541255951, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:50.697131Z", "loop": 3219, "env_steps": 1978367999, "loss": 0.0009010028443299234, "avg_return": 0.4437847137451172, "regret": 0.35066983103752136, "entropy": 0.06927140802145004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:51.907539Z", "loop": 3220, "env_steps": 1978982399, "loss": 0.0007818072335794568, "avg_return": 0.4485008716583252, "regret": 0.35067033767700195, "entropy": 0.06979675590991974, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:53.068178Z", "loop": 3221, "env_steps": 1979596799, "loss": 0.0008788313716650009, "avg_return": 0.4510558247566223, "regret": 0.35067033767700195, "entropy": 0.06791076809167862, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:54.228867Z", "loop": 3222, "env_steps": 1980211199, "loss": 0.0007799442973919213, "avg_return": 0.4482935667037964, "regret": 0.35067033767700195, "entropy": 0.067604199051857, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:55.389886Z", "loop": 3223, "env_steps": 1980825599, "loss": 0.0008428259170614183, "avg_return": 0.4543081223964691, "regret": 0.35067033767700195, "entropy": 0.06640885025262833, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:56.551881Z", "loop": 3224, "env_steps": 1981439999, "loss": 0.0007984416442923248, "avg_return": 0.4514751434326172, "regret": 0.35067033767700195, "entropy": 0.06279103457927704, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:57.713032Z", "loop": 3225, "env_steps": 1982054399, "loss": 0.000922224426176399, "avg_return": 0.44817984104156494, "regret": 0.35067033767700195, "entropy": 0.06303671002388, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:28:58.874731Z", "loop": 3226, "env_steps": 1982668799, "loss": 0.000957162061240524, "avg_return": 0.45260289311408997, "regret": 0.35067033767700195, "entropy": 0.06444313377141953, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:00.035210Z", "loop": 3227, "env_steps": 1983283199, "loss": 0.0007916443282738328, "avg_return": 0.4452183246612549, "regret": 0.35067033767700195, "entropy": 0.07016174495220184, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:01.196180Z", "loop": 3228, "env_steps": 1983897599, "loss": 0.0010375319980084896, "avg_return": 0.44824036955833435, "regret": 0.35067033767700195, "entropy": 0.06391505897045135, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:02.357963Z", "loop": 3229, "env_steps": 1984511999, "loss": 0.0009657497867010534, "avg_return": 0.44791698455810547, "regret": 0.35067033767700195, "entropy": 0.0676477923989296, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:03.567084Z", "loop": 3230, "env_steps": 1985126399, "loss": 0.0010460215853527188, "avg_return": 0.45580190420150757, "regret": 0.35071903467178345, "entropy": 0.06357967853546143, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:04.728852Z", "loop": 3231, "env_steps": 1985740799, "loss": 0.0011360436910763383, "avg_return": 0.4585185945034027, "regret": 0.35071903467178345, "entropy": 0.06663178652524948, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:05.890113Z", "loop": 3232, "env_steps": 1986355199, "loss": 0.0009911293163895607, "avg_return": 0.4530010223388672, "regret": 0.35071903467178345, "entropy": 0.06468735635280609, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:07.052832Z", "loop": 3233, "env_steps": 1986969599, "loss": 0.0009033381938934326, "avg_return": 0.44856929779052734, "regret": 0.35071903467178345, "entropy": 0.06994803249835968, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:08.213388Z", "loop": 3234, "env_steps": 1987583999, "loss": 0.0009332417394034564, "avg_return": 0.4560696482658386, "regret": 0.35071903467178345, "entropy": 0.05977940931916237, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:09.375159Z", "loop": 3235, "env_steps": 1988198399, "loss": 0.0009334664791822433, "avg_return": 0.4501708447933197, "regret": 0.35071903467178345, "entropy": 0.06151430308818817, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:10.537543Z", "loop": 3236, "env_steps": 1988812799, "loss": 0.0007826524088159204, "avg_return": 0.45525848865509033, "regret": 0.35071903467178345, "entropy": 0.06477560847997665, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:11.699275Z", "loop": 3237, "env_steps": 1989427199, "loss": 0.0007551144226454198, "avg_return": 0.45032787322998047, "regret": 0.35071903467178345, "entropy": 0.06594555824995041, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:12.861290Z", "loop": 3238, "env_steps": 1990041599, "loss": 0.0007307567284442484, "avg_return": 0.4446796774864197, "regret": 0.35071903467178345, "entropy": 0.06093765050172806, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:14.021422Z", "loop": 3239, "env_steps": 1990655999, "loss": 0.0007260770653374493, "avg_return": 0.4500409960746765, "regret": 0.35071903467178345, "entropy": 0.0630224198102951, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:15.232386Z", "loop": 3240, "env_steps": 1991270399, "loss": 0.000617512094322592, "avg_return": 0.45800018310546875, "regret": 0.3506805896759033, "entropy": 0.06130293384194374, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:16.393057Z", "loop": 3241, "env_steps": 1991884799, "loss": 0.0005394441541284323, "avg_return": 0.45537543296813965, "regret": 0.3506805896759033, "entropy": 0.06736882030963898, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:17.554874Z", "loop": 3242, "env_steps": 1992499199, "loss": 0.0005874269409105182, "avg_return": 0.44991302490234375, "regret": 0.3506805896759033, "entropy": 0.06491091102361679, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:18.715817Z", "loop": 3243, "env_steps": 1993113599, "loss": 0.0005530673079192638, "avg_return": 0.45373964309692383, "regret": 0.3506805896759033, "entropy": 0.06203584372997284, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:19.878161Z", "loop": 3244, "env_steps": 1993727999, "loss": 0.0007880643825046718, "avg_return": 0.45787689089775085, "regret": 0.3506805896759033, "entropy": 0.07093574851751328, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:21.041160Z", "loop": 3245, "env_steps": 1994342399, "loss": 0.0005996389663778245, "avg_return": 0.4514337182044983, "regret": 0.3506805896759033, "entropy": 0.0657794326543808, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:22.203726Z", "loop": 3246, "env_steps": 1994956799, "loss": 0.0006981041515246034, "avg_return": 0.45083415508270264, "regret": 0.3506805896759033, "entropy": 0.06766632199287415, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:23.365313Z", "loop": 3247, "env_steps": 1995571199, "loss": 0.0008021746762096882, "avg_return": 0.45553141832351685, "regret": 0.3506805896759033, "entropy": 0.07127192616462708, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:24.526669Z", "loop": 3248, "env_steps": 1996185599, "loss": 0.0007909933920018375, "avg_return": 0.45430755615234375, "regret": 0.3506805896759033, "entropy": 0.06658099591732025, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:25.686782Z", "loop": 3249, "env_steps": 1996799999, "loss": 0.0008322513895109296, "avg_return": 0.4440958797931671, "regret": 0.3506805896759033, "entropy": 0.07149139791727066, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:26.893027Z", "loop": 3250, "env_steps": 1997414399, "loss": 0.0008589687058702111, "avg_return": 0.4545852243900299, "regret": 0.3510074317455292, "entropy": 0.0765252634882927, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:28.055462Z", "loop": 3251, "env_steps": 1998028799, "loss": 0.00099059974309057, "avg_return": 0.4575974643230438, "regret": 0.3510074317455292, "entropy": 0.07186225801706314, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:29.215659Z", "loop": 3252, "env_steps": 1998643199, "loss": 0.000904303917195648, "avg_return": 0.44773346185684204, "regret": 0.3510074317455292, "entropy": 0.07365116477012634, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:30.376494Z", "loop": 3253, "env_steps": 1999257599, "loss": 0.0007583426777273417, "avg_return": 0.4547992944717407, "regret": 0.3510074317455292, "entropy": 0.07248852401971817, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:31.539610Z", "loop": 3254, "env_steps": 1999871999, "loss": 0.000844480178784579, "avg_return": 0.4562056064605713, "regret": 0.3510074317455292, "entropy": 0.07419098168611526, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:32.701764Z", "loop": 3255, "env_steps": 2000486399, "loss": 0.0006462494493462145, "avg_return": 0.4531232714653015, "regret": 0.3510074317455292, "entropy": 0.06668305397033691, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:33.863518Z", "loop": 3256, "env_steps": 2001100799, "loss": 0.0007769038784317672, "avg_return": 0.4520426094532013, "regret": 0.3510074317455292, "entropy": 0.06568469107151031, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:35.023526Z", "loop": 3257, "env_steps": 2001715199, "loss": 0.0007939509232528508, "avg_return": 0.4539835751056671, "regret": 0.3510074317455292, "entropy": 0.0742659717798233, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:36.184690Z", "loop": 3258, "env_steps": 2002329599, "loss": 0.0009469676879234612, "avg_return": 0.4514494836330414, "regret": 0.3510074317455292, "entropy": 0.06905090063810349, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:37.348056Z", "loop": 3259, "env_steps": 2002943999, "loss": 0.0008557824767194688, "avg_return": 0.4560028314590454, "regret": 0.3510074317455292, "entropy": 0.06760864704847336, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:38.555656Z", "loop": 3260, "env_steps": 2003558399, "loss": 0.0008838166831992567, "avg_return": 0.45069652795791626, "regret": 0.35110628604888916, "entropy": 0.07231957465410233, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:39.717226Z", "loop": 3261, "env_steps": 2004172799, "loss": 0.0009030710789375007, "avg_return": 0.46173036098480225, "regret": 0.35110628604888916, "entropy": 0.06706268340349197, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:40.877897Z", "loop": 3262, "env_steps": 2004787199, "loss": 0.0008210371597670019, "avg_return": 0.46001526713371277, "regret": 0.35110628604888916, "entropy": 0.06686247885227203, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:42.039190Z", "loop": 3263, "env_steps": 2005401599, "loss": 0.0008047955925576389, "avg_return": 0.45104026794433594, "regret": 0.35110628604888916, "entropy": 0.07337874174118042, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:43.199351Z", "loop": 3264, "env_steps": 2006015999, "loss": 0.0007951011066325009, "avg_return": 0.4497092664241791, "regret": 0.35110628604888916, "entropy": 0.07072364538908005, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:44.360486Z", "loop": 3265, "env_steps": 2006630399, "loss": 0.000682214624248445, "avg_return": 0.4598981738090515, "regret": 0.35110628604888916, "entropy": 0.0680236965417862, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:45.520812Z", "loop": 3266, "env_steps": 2007244799, "loss": 0.00044159902608953416, "avg_return": 0.44633230566978455, "regret": 0.35110628604888916, "entropy": 0.06765934079885483, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:46.681733Z", "loop": 3267, "env_steps": 2007859199, "loss": 0.0005843718536198139, "avg_return": 0.44898882508277893, "regret": 0.35110628604888916, "entropy": 0.0609576590359211, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:47.843327Z", "loop": 3268, "env_steps": 2008473599, "loss": 0.0005075828521512449, "avg_return": 0.4504982531070709, "regret": 0.35110628604888916, "entropy": 0.062145788222551346, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:49.004307Z", "loop": 3269, "env_steps": 2009087999, "loss": 0.0006039826548658311, "avg_return": 0.4596033990383148, "regret": 0.35110628604888916, "entropy": 0.06208278611302376, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:50.211681Z", "loop": 3270, "env_steps": 2009702399, "loss": 0.0006474446854554117, "avg_return": 0.4489445090293884, "regret": 0.35078099370002747, "entropy": 0.0637378916144371, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:51.373198Z", "loop": 3271, "env_steps": 2010316799, "loss": 0.0006857860716991127, "avg_return": 0.45312583446502686, "regret": 0.35078099370002747, "entropy": 0.0634959265589714, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:52.534593Z", "loop": 3272, "env_steps": 2010931199, "loss": 0.0006469014915637672, "avg_return": 0.45356762409210205, "regret": 0.35078099370002747, "entropy": 0.065658800303936, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:53.694619Z", "loop": 3273, "env_steps": 2011545599, "loss": 0.0005884572747163475, "avg_return": 0.45152395963668823, "regret": 0.35078099370002747, "entropy": 0.061575524508953094, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:54.855672Z", "loop": 3274, "env_steps": 2012159999, "loss": 0.0006292979815043509, "avg_return": 0.44139528274536133, "regret": 0.35078099370002747, "entropy": 0.06883782148361206, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:56.015652Z", "loop": 3275, "env_steps": 2012774399, "loss": 0.0005773535231128335, "avg_return": 0.450558066368103, "regret": 0.35078099370002747, "entropy": 0.06373550742864609, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:57.176147Z", "loop": 3276, "env_steps": 2013388799, "loss": 0.0005520211416296661, "avg_return": 0.44775381684303284, "regret": 0.35078099370002747, "entropy": 0.06468991935253143, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:58.337643Z", "loop": 3277, "env_steps": 2014003199, "loss": 0.0004869178810622543, "avg_return": 0.45011332631111145, "regret": 0.35078099370002747, "entropy": 0.06687326729297638, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:29:59.498484Z", "loop": 3278, "env_steps": 2014617599, "loss": 0.0006710920133627951, "avg_return": 0.4586319029331207, "regret": 0.35078099370002747, "entropy": 0.0716535747051239, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:00.660005Z", "loop": 3279, "env_steps": 2015231999, "loss": 0.0006332574994303286, "avg_return": 0.45315995812416077, "regret": 0.35078099370002747, "entropy": 0.0589788444340229, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:01.865138Z", "loop": 3280, "env_steps": 2015846399, "loss": 0.000669284665491432, "avg_return": 0.4544062316417694, "regret": 0.3507027328014374, "entropy": 0.06831318885087967, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:03.027114Z", "loop": 3281, "env_steps": 2016460799, "loss": 0.0006664035608991981, "avg_return": 0.4519153833389282, "regret": 0.3507027328014374, "entropy": 0.0688728392124176, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:04.190272Z", "loop": 3282, "env_steps": 2017075199, "loss": 0.0006229159771464765, "avg_return": 0.4487377107143402, "regret": 0.3507027328014374, "entropy": 0.07242349535226822, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:05.351207Z", "loop": 3283, "env_steps": 2017689599, "loss": 0.0007402195478789508, "avg_return": 0.4562057554721832, "regret": 0.3507027328014374, "entropy": 0.07259576767683029, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:06.511494Z", "loop": 3284, "env_steps": 2018303999, "loss": 0.0008837942150421441, "avg_return": 0.4553593695163727, "regret": 0.3507027328014374, "entropy": 0.07303018867969513, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:07.671949Z", "loop": 3285, "env_steps": 2018918399, "loss": 0.0007690451457165182, "avg_return": 0.45353323221206665, "regret": 0.3507027328014374, "entropy": 0.07242313027381897, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:08.834741Z", "loop": 3286, "env_steps": 2019532799, "loss": 0.0006730243330821395, "avg_return": 0.4551815986633301, "regret": 0.3507027328014374, "entropy": 0.0656750500202179, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:09.996700Z", "loop": 3287, "env_steps": 2020147199, "loss": 0.0006061827298253775, "avg_return": 0.4528968334197998, "regret": 0.3507027328014374, "entropy": 0.06625930964946747, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:11.157902Z", "loop": 3288, "env_steps": 2020761599, "loss": 0.0005933462525717914, "avg_return": 0.4548835754394531, "regret": 0.3507027328014374, "entropy": 0.06341253966093063, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:12.317873Z", "loop": 3289, "env_steps": 2021375999, "loss": 0.0006410999922081828, "avg_return": 0.45349204540252686, "regret": 0.3507027328014374, "entropy": 0.06394749134778976, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:13.533337Z", "loop": 3290, "env_steps": 2021990399, "loss": 0.0005723278736695647, "avg_return": 0.4553636312484741, "regret": 0.35063478350639343, "entropy": 0.06516638398170471, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:14.693969Z", "loop": 3291, "env_steps": 2022604799, "loss": 0.0006754546775482595, "avg_return": 0.4511522054672241, "regret": 0.35063478350639343, "entropy": 0.0625251978635788, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:15.855859Z", "loop": 3292, "env_steps": 2023219199, "loss": 0.0007027186802588403, "avg_return": 0.44908833503723145, "regret": 0.35063478350639343, "entropy": 0.0643085464835167, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:17.017684Z", "loop": 3293, "env_steps": 2023833599, "loss": 0.0006165254744701087, "avg_return": 0.45518845319747925, "regret": 0.35063478350639343, "entropy": 0.061633218079805374, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:18.178659Z", "loop": 3294, "env_steps": 2024447999, "loss": 0.0006796458619646728, "avg_return": 0.45162954926490784, "regret": 0.35063478350639343, "entropy": 0.0675276443362236, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:19.340346Z", "loop": 3295, "env_steps": 2025062399, "loss": 0.0005726983654312789, "avg_return": 0.4534190595149994, "regret": 0.35063478350639343, "entropy": 0.06835134327411652, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:20.500802Z", "loop": 3296, "env_steps": 2025676799, "loss": 0.0007164729759097099, "avg_return": 0.4491558074951172, "regret": 0.35063478350639343, "entropy": 0.06498327106237411, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:21.662240Z", "loop": 3297, "env_steps": 2026291199, "loss": 0.0007405228679999709, "avg_return": 0.46515554189682007, "regret": 0.35063478350639343, "entropy": 0.060680802911520004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:22.823924Z", "loop": 3298, "env_steps": 2026905599, "loss": 0.0007491169380955398, "avg_return": 0.4569990038871765, "regret": 0.35063478350639343, "entropy": 0.06459537893533707, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:23.984930Z", "loop": 3299, "env_steps": 2027519999, "loss": 0.000773911364376545, "avg_return": 0.4431256353855133, "regret": 0.35063478350639343, "entropy": 0.06846814602613449, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:25.192158Z", "loop": 3300, "env_steps": 2028134399, "loss": 0.000981128541752696, "avg_return": 0.4542391002178192, "regret": 0.35068899393081665, "entropy": 0.07193323224782944, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:26.353291Z", "loop": 3301, "env_steps": 2028748799, "loss": 0.0009857667610049248, "avg_return": 0.4523886740207672, "regret": 0.35068899393081665, "entropy": 0.07419636100530624, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:27.515425Z", "loop": 3302, "env_steps": 2029363199, "loss": 0.001389106153510511, "avg_return": 0.4527122974395752, "regret": 0.35068899393081665, "entropy": 0.07035696506500244, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:28.676729Z", "loop": 3303, "env_steps": 2029977599, "loss": 0.0014659337466582656, "avg_return": 0.44530752301216125, "regret": 0.35068899393081665, "entropy": 0.07323712855577469, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:29.839622Z", "loop": 3304, "env_steps": 2030591999, "loss": 0.001831706496886909, "avg_return": 0.4582218527793884, "regret": 0.35068899393081665, "entropy": 0.08009136468172073, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:31.000981Z", "loop": 3305, "env_steps": 2031206399, "loss": 0.002286301227286458, "avg_return": 0.4570392072200775, "regret": 0.35068899393081665, "entropy": 0.08691515773534775, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:32.163387Z", "loop": 3306, "env_steps": 2031820799, "loss": 0.002316779224202037, "avg_return": 0.44838330149650574, "regret": 0.35068899393081665, "entropy": 0.08620266616344452, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:33.325119Z", "loop": 3307, "env_steps": 2032435199, "loss": 0.0025891351979225874, "avg_return": 0.45318377017974854, "regret": 0.35068899393081665, "entropy": 0.09178918600082397, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:34.485733Z", "loop": 3308, "env_steps": 2033049599, "loss": 0.0027116918936371803, "avg_return": 0.4443613290786743, "regret": 0.35068899393081665, "entropy": 0.08767671883106232, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:35.647331Z", "loop": 3309, "env_steps": 2033663999, "loss": 0.002698237542062998, "avg_return": 0.4432874023914337, "regret": 0.35068899393081665, "entropy": 0.08988375216722488, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:36.855125Z", "loop": 3310, "env_steps": 2034278399, "loss": 0.0033288977574557066, "avg_return": 0.44338110089302063, "regret": 0.3616752028465271, "entropy": 0.0895204022526741, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:38.016953Z", "loop": 3311, "env_steps": 2034892799, "loss": 0.003151532029733062, "avg_return": 0.4373719394207001, "regret": 0.3616752028465271, "entropy": 0.09258327633142471, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:39.178233Z", "loop": 3312, "env_steps": 2035507199, "loss": 0.0029910316225141287, "avg_return": 0.44980743527412415, "regret": 0.3616752028465271, "entropy": 0.08546732366085052, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:40.342572Z", "loop": 3313, "env_steps": 2036121599, "loss": 0.0027541278395801783, "avg_return": 0.44730520248413086, "regret": 0.3616752028465271, "entropy": 0.08066559582948685, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:41.505148Z", "loop": 3314, "env_steps": 2036735999, "loss": 0.002376557094976306, "avg_return": 0.4514450132846832, "regret": 0.3616752028465271, "entropy": 0.0726003497838974, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:42.667131Z", "loop": 3315, "env_steps": 2037350399, "loss": 0.0018958073342218995, "avg_return": 0.45317283272743225, "regret": 0.3616752028465271, "entropy": 0.06932386010885239, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:43.828722Z", "loop": 3316, "env_steps": 2037964799, "loss": 0.0017248549265787005, "avg_return": 0.4553133249282837, "regret": 0.3616752028465271, "entropy": 0.07192067056894302, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:44.989040Z", "loop": 3317, "env_steps": 2038579199, "loss": 0.0012836450478062034, "avg_return": 0.45573487877845764, "regret": 0.3616752028465271, "entropy": 0.06470349431037903, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:46.150148Z", "loop": 3318, "env_steps": 2039193599, "loss": 0.0013153799809515476, "avg_return": 0.45056962966918945, "regret": 0.3616752028465271, "entropy": 0.06859634816646576, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:47.314914Z", "loop": 3319, "env_steps": 2039807999, "loss": 0.0011632625246420503, "avg_return": 0.4526546895503998, "regret": 0.3616752028465271, "entropy": 0.0626344159245491, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:48.522377Z", "loop": 3320, "env_steps": 2040422399, "loss": 0.0010699030244722962, "avg_return": 0.4520139694213867, "regret": 0.3506966531276703, "entropy": 0.06024986878037453, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:49.684061Z", "loop": 3321, "env_steps": 2041036799, "loss": 0.001122961868532002, "avg_return": 0.46261128783226013, "regret": 0.3506966531276703, "entropy": 0.06125636398792267, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:50.846665Z", "loop": 3322, "env_steps": 2041651199, "loss": 0.0011709310347214341, "avg_return": 0.45555251836776733, "regret": 0.3506966531276703, "entropy": 0.05509479343891144, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:52.012041Z", "loop": 3323, "env_steps": 2042265599, "loss": 0.00078673439566046, "avg_return": 0.45052632689476013, "regret": 0.3506966531276703, "entropy": 0.05990798771381378, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:53.174336Z", "loop": 3324, "env_steps": 2042879999, "loss": 0.0010617049410939217, "avg_return": 0.45189282298088074, "regret": 0.3506966531276703, "entropy": 0.060227930545806885, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:54.337067Z", "loop": 3325, "env_steps": 2043494399, "loss": 0.0009626272949390113, "avg_return": 0.45883113145828247, "regret": 0.3506966531276703, "entropy": 0.06717785447835922, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:55.498325Z", "loop": 3326, "env_steps": 2044108799, "loss": 0.0012173036811873317, "avg_return": 0.45541414618492126, "regret": 0.3506966531276703, "entropy": 0.06940559297800064, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:56.661099Z", "loop": 3327, "env_steps": 2044723199, "loss": 0.0011273011332377791, "avg_return": 0.4506806433200836, "regret": 0.3506966531276703, "entropy": 0.05945828929543495, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:57.822996Z", "loop": 3328, "env_steps": 2045337599, "loss": 0.0008955858647823334, "avg_return": 0.4435674250125885, "regret": 0.3506966531276703, "entropy": 0.06584694236516953, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:30:58.984270Z", "loop": 3329, "env_steps": 2045951999, "loss": 0.0008156276308000088, "avg_return": 0.4484233856201172, "regret": 0.3506966531276703, "entropy": 0.06195628270506859, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:00.193352Z", "loop": 3330, "env_steps": 2046566399, "loss": 0.000967842002864927, "avg_return": 0.44851920008659363, "regret": 0.3510775864124298, "entropy": 0.06623265147209167, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:01.355530Z", "loop": 3331, "env_steps": 2047180799, "loss": 0.0009991357801482081, "avg_return": 0.4591875374317169, "regret": 0.3510775864124298, "entropy": 0.06565601378679276, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:02.517609Z", "loop": 3332, "env_steps": 2047795199, "loss": 0.0012043764581903815, "avg_return": 0.4540847837924957, "regret": 0.3510775864124298, "entropy": 0.06562232971191406, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:03.677501Z", "loop": 3333, "env_steps": 2048409599, "loss": 0.001088765449821949, "avg_return": 0.45310208201408386, "regret": 0.3510775864124298, "entropy": 0.05432334169745445, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:04.838639Z", "loop": 3334, "env_steps": 2049023999, "loss": 0.0011774961603805423, "avg_return": 0.4578947126865387, "regret": 0.3510775864124298, "entropy": 0.05101842060685158, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:06.000089Z", "loop": 3335, "env_steps": 2049638399, "loss": 0.001418373198248446, "avg_return": 0.45854493975639343, "regret": 0.3510775864124298, "entropy": 0.05651765316724777, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:07.161458Z", "loop": 3336, "env_steps": 2050252799, "loss": 0.002319454215466976, "avg_return": 0.4635518491268158, "regret": 0.3510775864124298, "entropy": 0.06339318305253983, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:08.323047Z", "loop": 3337, "env_steps": 2050867199, "loss": 0.0023883904796093702, "avg_return": 0.45592835545539856, "regret": 0.3510775864124298, "entropy": 0.07053408026695251, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:09.489784Z", "loop": 3338, "env_steps": 2051481599, "loss": 0.0030052007641643286, "avg_return": 0.4541374742984772, "regret": 0.3510775864124298, "entropy": 0.07422567903995514, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:10.651130Z", "loop": 3339, "env_steps": 2052095999, "loss": 0.002773058833554387, "avg_return": 0.4540994465351105, "regret": 0.3510775864124298, "entropy": 0.07177652418613434, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:11.859266Z", "loop": 3340, "env_steps": 2052710399, "loss": 0.0030217613093554974, "avg_return": 0.4559227526187897, "regret": 0.3520970046520233, "entropy": 0.07344729453325272, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:13.020512Z", "loop": 3341, "env_steps": 2053324799, "loss": 0.0023964964784681797, "avg_return": 0.4509519934654236, "regret": 0.3520970046520233, "entropy": 0.06399057060480118, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:14.180866Z", "loop": 3342, "env_steps": 2053939199, "loss": 0.0016775954281911254, "avg_return": 0.4566101133823395, "regret": 0.3520970046520233, "entropy": 0.05218332260847092, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:15.341935Z", "loop": 3343, "env_steps": 2054553599, "loss": 0.0013438996393233538, "avg_return": 0.4528714120388031, "regret": 0.3520970046520233, "entropy": 0.05073223635554314, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:16.503993Z", "loop": 3344, "env_steps": 2055167999, "loss": 0.0009687226265668869, "avg_return": 0.4582307040691376, "regret": 0.3520970046520233, "entropy": 0.048303958028554916, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:17.664763Z", "loop": 3345, "env_steps": 2055782399, "loss": 0.001028523431159556, "avg_return": 0.4528607428073883, "regret": 0.3520970046520233, "entropy": 0.050520025193691254, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:18.826876Z", "loop": 3346, "env_steps": 2056396799, "loss": 0.000934201932977885, "avg_return": 0.4520294666290283, "regret": 0.3520970046520233, "entropy": 0.05597233027219772, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:19.987441Z", "loop": 3347, "env_steps": 2057011199, "loss": 0.0012394757941365242, "avg_return": 0.45532745122909546, "regret": 0.3520970046520233, "entropy": 0.056570228189229965, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:21.148352Z", "loop": 3348, "env_steps": 2057625599, "loss": 0.0011972598731517792, "avg_return": 0.45560720562934875, "regret": 0.3520970046520233, "entropy": 0.06030320003628731, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:22.310213Z", "loop": 3349, "env_steps": 2058239999, "loss": 0.0010712499497458339, "avg_return": 0.4498039782047272, "regret": 0.3520970046520233, "entropy": 0.06597147136926651, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:23.515211Z", "loop": 3350, "env_steps": 2058854399, "loss": 0.0010413221316412091, "avg_return": 0.45228713750839233, "regret": 0.35095229744911194, "entropy": 0.05565136298537254, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:24.676662Z", "loop": 3351, "env_steps": 2059468799, "loss": 0.0007456957246176898, "avg_return": 0.4492003917694092, "regret": 0.35095229744911194, "entropy": 0.058500293642282486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:25.837719Z", "loop": 3352, "env_steps": 2060083199, "loss": 0.0007055148016661406, "avg_return": 0.45224934816360474, "regret": 0.35095229744911194, "entropy": 0.0622057244181633, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:26.999520Z", "loop": 3353, "env_steps": 2060697599, "loss": 0.0006721948739141226, "avg_return": 0.44622859358787537, "regret": 0.35095229744911194, "entropy": 0.0587090402841568, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:28.163296Z", "loop": 3354, "env_steps": 2061311999, "loss": 0.0008404319523833692, "avg_return": 0.4544388949871063, "regret": 0.35095229744911194, "entropy": 0.05790194123983383, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:29.325089Z", "loop": 3355, "env_steps": 2061926399, "loss": 0.000848562631290406, "avg_return": 0.452085018157959, "regret": 0.35095229744911194, "entropy": 0.057488374412059784, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:30.486456Z", "loop": 3356, "env_steps": 2062540799, "loss": 0.0010166186839342117, "avg_return": 0.45391806960105896, "regret": 0.35095229744911194, "entropy": 0.062135934829711914, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:31.647069Z", "loop": 3357, "env_steps": 2063155199, "loss": 0.0012434646487236023, "avg_return": 0.45526641607284546, "regret": 0.35095229744911194, "entropy": 0.06429082900285721, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:32.811499Z", "loop": 3358, "env_steps": 2063769599, "loss": 0.001149179064668715, "avg_return": 0.45139771699905396, "regret": 0.35095229744911194, "entropy": 0.06409058719873428, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:33.974761Z", "loop": 3359, "env_steps": 2064383999, "loss": 0.0007733850507065654, "avg_return": 0.45017918944358826, "regret": 0.35095229744911194, "entropy": 0.0610627755522728, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:35.186226Z", "loop": 3360, "env_steps": 2064998399, "loss": 0.0005760888452641666, "avg_return": 0.44564658403396606, "regret": 0.3518311679363251, "entropy": 0.05808325856924057, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:36.347065Z", "loop": 3361, "env_steps": 2065612799, "loss": 0.00057302659843117, "avg_return": 0.45483121275901794, "regret": 0.3518311679363251, "entropy": 0.05892489105463028, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:37.508660Z", "loop": 3362, "env_steps": 2066227199, "loss": 0.0006597178289666772, "avg_return": 0.45172882080078125, "regret": 0.3518311679363251, "entropy": 0.06714686006307602, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:38.668238Z", "loop": 3363, "env_steps": 2066841599, "loss": 0.0010875294683501124, "avg_return": 0.45396146178245544, "regret": 0.3518311679363251, "entropy": 0.06776274740695953, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:39.833013Z", "loop": 3364, "env_steps": 2067455999, "loss": 0.0012013008818030357, "avg_return": 0.45409008860588074, "regret": 0.3518311679363251, "entropy": 0.06919695436954498, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:41.002225Z", "loop": 3365, "env_steps": 2068070399, "loss": 0.0016385391354560852, "avg_return": 0.45285162329673767, "regret": 0.3518311679363251, "entropy": 0.07717196643352509, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:42.164279Z", "loop": 3366, "env_steps": 2068684799, "loss": 0.0016583234537392855, "avg_return": 0.4534813165664673, "regret": 0.3518311679363251, "entropy": 0.0775320753455162, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:43.326663Z", "loop": 3367, "env_steps": 2069299199, "loss": 0.001699200482107699, "avg_return": 0.45754292607307434, "regret": 0.3518311679363251, "entropy": 0.07833094149827957, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:44.489303Z", "loop": 3368, "env_steps": 2069913599, "loss": 0.0019089553970843554, "avg_return": 0.4508839547634125, "regret": 0.3518311679363251, "entropy": 0.08476461470127106, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:45.650942Z", "loop": 3369, "env_steps": 2070527999, "loss": 0.0016776713309809566, "avg_return": 0.4514102339744568, "regret": 0.3518311679363251, "entropy": 0.07630638778209686, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:46.861532Z", "loop": 3370, "env_steps": 2071142399, "loss": 0.001345049007795751, "avg_return": 0.45695599913597107, "regret": 0.352220356464386, "entropy": 0.07125110924243927, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:48.028098Z", "loop": 3371, "env_steps": 2071756799, "loss": 0.001076397835277021, "avg_return": 0.44858449697494507, "regret": 0.352220356464386, "entropy": 0.0665711909532547, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:49.192953Z", "loop": 3372, "env_steps": 2072371199, "loss": 0.0007637140806764364, "avg_return": 0.4440699815750122, "regret": 0.352220356464386, "entropy": 0.061931312084198, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:50.353963Z", "loop": 3373, "env_steps": 2072985599, "loss": 0.0007755189435556531, "avg_return": 0.45754024386405945, "regret": 0.352220356464386, "entropy": 0.05351713299751282, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:51.515369Z", "loop": 3374, "env_steps": 2073599999, "loss": 0.0005347798578441143, "avg_return": 0.4493839740753174, "regret": 0.352220356464386, "entropy": 0.055349092930555344, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:52.676732Z", "loop": 3375, "env_steps": 2074214399, "loss": 0.0005581681616604328, "avg_return": 0.4562641382217407, "regret": 0.352220356464386, "entropy": 0.056994181126356125, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:53.837613Z", "loop": 3376, "env_steps": 2074828799, "loss": 0.0006166015518829226, "avg_return": 0.45803141593933105, "regret": 0.352220356464386, "entropy": 0.05508042499423027, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:54.999252Z", "loop": 3377, "env_steps": 2075443199, "loss": 0.0004894191515631974, "avg_return": 0.4589102864265442, "regret": 0.352220356464386, "entropy": 0.060356609523296356, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:56.161464Z", "loop": 3378, "env_steps": 2076057599, "loss": 0.0005015604547224939, "avg_return": 0.4516910910606384, "regret": 0.352220356464386, "entropy": 0.06187712028622627, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:57.328021Z", "loop": 3379, "env_steps": 2076671999, "loss": 0.0005056465161032975, "avg_return": 0.45793235301971436, "regret": 0.352220356464386, "entropy": 0.05864660069346428, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:58.538925Z", "loop": 3380, "env_steps": 2077286399, "loss": 0.000560498796403408, "avg_return": 0.45486441254615784, "regret": 0.35096800327301025, "entropy": 0.05711046978831291, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:31:59.700618Z", "loop": 3381, "env_steps": 2077900799, "loss": 0.0005533306393772364, "avg_return": 0.4567883312702179, "regret": 0.35096800327301025, "entropy": 0.056588150560855865, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:00.863139Z", "loop": 3382, "env_steps": 2078515199, "loss": 0.0005552055081352592, "avg_return": 0.4552037715911865, "regret": 0.35096800327301025, "entropy": 0.05715683475136757, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:02.023608Z", "loop": 3383, "env_steps": 2079129599, "loss": 0.0005574416718445718, "avg_return": 0.45280590653419495, "regret": 0.35096800327301025, "entropy": 0.05570283904671669, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:03.185289Z", "loop": 3384, "env_steps": 2079743999, "loss": 0.0005393199971877038, "avg_return": 0.45543956756591797, "regret": 0.35096800327301025, "entropy": 0.06067374348640442, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:04.345088Z", "loop": 3385, "env_steps": 2080358399, "loss": 0.0005978936678729951, "avg_return": 0.45756837725639343, "regret": 0.35096800327301025, "entropy": 0.05440407618880272, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:05.506103Z", "loop": 3386, "env_steps": 2080972799, "loss": 0.0006651388830505311, "avg_return": 0.45188745856285095, "regret": 0.35096800327301025, "entropy": 0.05574497580528259, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:06.665679Z", "loop": 3387, "env_steps": 2081587199, "loss": 0.0007898997864685953, "avg_return": 0.44812601804733276, "regret": 0.35096800327301025, "entropy": 0.05563122779130936, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:07.825859Z", "loop": 3388, "env_steps": 2082201599, "loss": 0.0007696780958212912, "avg_return": 0.454654335975647, "regret": 0.35096800327301025, "entropy": 0.0551261380314827, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:08.987272Z", "loop": 3389, "env_steps": 2082815999, "loss": 0.0007740305154584348, "avg_return": 0.44606903195381165, "regret": 0.35096800327301025, "entropy": 0.06552913784980774, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:10.194763Z", "loop": 3390, "env_steps": 2083430399, "loss": 0.0006487165810540318, "avg_return": 0.4493389129638672, "regret": 0.35064759850502014, "entropy": 0.054777830839157104, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:11.359119Z", "loop": 3391, "env_steps": 2084044799, "loss": 0.0007472594152204692, "avg_return": 0.4490039646625519, "regret": 0.35064759850502014, "entropy": 0.05975588783621788, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:12.521336Z", "loop": 3392, "env_steps": 2084659199, "loss": 0.0006698399665765464, "avg_return": 0.4593425691127777, "regret": 0.35064759850502014, "entropy": 0.056066710501909256, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:13.685690Z", "loop": 3393, "env_steps": 2085273599, "loss": 0.0006833055522292852, "avg_return": 0.45408275723457336, "regret": 0.35064759850502014, "entropy": 0.05267403647303581, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:14.847461Z", "loop": 3394, "env_steps": 2085887999, "loss": 0.0005925358273088932, "avg_return": 0.4495266377925873, "regret": 0.35064759850502014, "entropy": 0.05812887102365494, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:16.009394Z", "loop": 3395, "env_steps": 2086502399, "loss": 0.0005079588736407459, "avg_return": 0.44691550731658936, "regret": 0.35064759850502014, "entropy": 0.058656297624111176, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:17.173487Z", "loop": 3396, "env_steps": 2087116799, "loss": 0.000610934104770422, "avg_return": 0.4525406062602997, "regret": 0.35064759850502014, "entropy": 0.051276400685310364, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:18.335425Z", "loop": 3397, "env_steps": 2087731199, "loss": 0.0005390431033447385, "avg_return": 0.45140859484672546, "regret": 0.35064759850502014, "entropy": 0.057121094316244125, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:19.496952Z", "loop": 3398, "env_steps": 2088345599, "loss": 0.0004600067622959614, "avg_return": 0.4515659809112549, "regret": 0.35064759850502014, "entropy": 0.05113237351179123, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:20.657193Z", "loop": 3399, "env_steps": 2088959999, "loss": 0.00048239619354717433, "avg_return": 0.45076411962509155, "regret": 0.35064759850502014, "entropy": 0.06411682814359665, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:21.865035Z", "loop": 3400, "env_steps": 2089574399, "loss": 0.00047220048145391047, "avg_return": 0.45399460196495056, "regret": 0.350678950548172, "entropy": 0.05066624656319618, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:23.026151Z", "loop": 3401, "env_steps": 2090188799, "loss": 0.000544512236956507, "avg_return": 0.45369523763656616, "regret": 0.350678950548172, "entropy": 0.0527891144156456, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:24.187798Z", "loop": 3402, "env_steps": 2090803199, "loss": 0.0005295317387208343, "avg_return": 0.45074281096458435, "regret": 0.350678950548172, "entropy": 0.05167480558156967, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:25.349178Z", "loop": 3403, "env_steps": 2091417599, "loss": 0.000619789061602205, "avg_return": 0.45556408166885376, "regret": 0.350678950548172, "entropy": 0.052442751824855804, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:26.510044Z", "loop": 3404, "env_steps": 2092031999, "loss": 0.0005113061051815748, "avg_return": 0.4558655023574829, "regret": 0.350678950548172, "entropy": 0.05257035791873932, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:27.672031Z", "loop": 3405, "env_steps": 2092646399, "loss": 0.00048583419993519783, "avg_return": 0.4512403607368469, "regret": 0.350678950548172, "entropy": 0.053068459033966064, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:28.836208Z", "loop": 3406, "env_steps": 2093260799, "loss": 0.0005951892817392945, "avg_return": 0.45884349942207336, "regret": 0.350678950548172, "entropy": 0.05521964654326439, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:29.999980Z", "loop": 3407, "env_steps": 2093875199, "loss": 0.0004933856544084847, "avg_return": 0.45079880952835083, "regret": 0.350678950548172, "entropy": 0.05588793754577637, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:31.163868Z", "loop": 3408, "env_steps": 2094489599, "loss": 0.0005610419320873916, "avg_return": 0.44641995429992676, "regret": 0.350678950548172, "entropy": 0.05767408385872841, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:32.324840Z", "loop": 3409, "env_steps": 2095103999, "loss": 0.00042913490324281156, "avg_return": 0.45262855291366577, "regret": 0.350678950548172, "entropy": 0.05321338400244713, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:33.537479Z", "loop": 3410, "env_steps": 2095718399, "loss": 0.00043821425060741603, "avg_return": 0.45699983835220337, "regret": 0.35059911012649536, "entropy": 0.054783664643764496, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:34.699631Z", "loop": 3411, "env_steps": 2096332799, "loss": 0.0004563478287309408, "avg_return": 0.4468913972377777, "regret": 0.35059911012649536, "entropy": 0.056042272597551346, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:35.861320Z", "loop": 3412, "env_steps": 2096947199, "loss": 0.00043162942165508866, "avg_return": 0.4499020576477051, "regret": 0.35059911012649536, "entropy": 0.059909529983997345, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:37.022260Z", "loop": 3413, "env_steps": 2097561599, "loss": 0.0005791594157926738, "avg_return": 0.45124462246894836, "regret": 0.35059911012649536, "entropy": 0.06234104558825493, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:38.183952Z", "loop": 3414, "env_steps": 2098175999, "loss": 0.0007920807111077011, "avg_return": 0.4517419934272766, "regret": 0.35059911012649536, "entropy": 0.055253129452466965, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:39.343885Z", "loop": 3415, "env_steps": 2098790399, "loss": 0.0010456112213432789, "avg_return": 0.45366185903549194, "regret": 0.35059911012649536, "entropy": 0.06065639108419418, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:40.505122Z", "loop": 3416, "env_steps": 2099404799, "loss": 0.0011782770743593574, "avg_return": 0.45464929938316345, "regret": 0.35059911012649536, "entropy": 0.06487413495779037, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:41.667184Z", "loop": 3417, "env_steps": 2100019199, "loss": 0.001597676076926291, "avg_return": 0.4510197639465332, "regret": 0.35059911012649536, "entropy": 0.07100038975477219, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:42.827583Z", "loop": 3418, "env_steps": 2100633599, "loss": 0.0014197592390701175, "avg_return": 0.4554687738418579, "regret": 0.35059911012649536, "entropy": 0.06490880995988846, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:43.993837Z", "loop": 3419, "env_steps": 2101247999, "loss": 0.0015113245462998748, "avg_return": 0.44696685671806335, "regret": 0.35059911012649536, "entropy": 0.06583555042743683, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:45.204582Z", "loop": 3420, "env_steps": 2101862399, "loss": 0.0018402524292469025, "avg_return": 0.452475905418396, "regret": 0.3508880138397217, "entropy": 0.07371808588504791, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:46.366010Z", "loop": 3421, "env_steps": 2102476799, "loss": 0.0019507193937897682, "avg_return": 0.44675955176353455, "regret": 0.3508880138397217, "entropy": 0.07913710922002792, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:47.526834Z", "loop": 3422, "env_steps": 2103091199, "loss": 0.0016799230361357331, "avg_return": 0.45574483275413513, "regret": 0.3508880138397217, "entropy": 0.07641638070344925, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:48.688925Z", "loop": 3423, "env_steps": 2103705599, "loss": 0.0015104778576642275, "avg_return": 0.4542374908924103, "regret": 0.3508880138397217, "entropy": 0.07409412413835526, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:49.850783Z", "loop": 3424, "env_steps": 2104319999, "loss": 0.0014450638554990292, "avg_return": 0.44988682866096497, "regret": 0.3508880138397217, "entropy": 0.06802418828010559, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:51.012044Z", "loop": 3425, "env_steps": 2104934399, "loss": 0.0013310814974829555, "avg_return": 0.45127442479133606, "regret": 0.3508880138397217, "entropy": 0.06816759705543518, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:52.174912Z", "loop": 3426, "env_steps": 2105548799, "loss": 0.0012151149567216635, "avg_return": 0.4538351595401764, "regret": 0.3508880138397217, "entropy": 0.06844697147607803, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:53.335102Z", "loop": 3427, "env_steps": 2106163199, "loss": 0.00134528789203614, "avg_return": 0.45475128293037415, "regret": 0.3508880138397217, "entropy": 0.07175063341856003, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:54.496508Z", "loop": 3428, "env_steps": 2106777599, "loss": 0.001463662483729422, "avg_return": 0.44553086161613464, "regret": 0.3508880138397217, "entropy": 0.0662284716963768, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:55.657882Z", "loop": 3429, "env_steps": 2107391999, "loss": 0.001813766430132091, "avg_return": 0.45042410492897034, "regret": 0.3508880138397217, "entropy": 0.07506152242422104, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:56.866436Z", "loop": 3430, "env_steps": 2108006399, "loss": 0.0017768644029274583, "avg_return": 0.4511995017528534, "regret": 0.3507302403450012, "entropy": 0.07547871023416519, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:58.030174Z", "loop": 3431, "env_steps": 2108620799, "loss": 0.0014613632811233401, "avg_return": 0.4501490294933319, "regret": 0.3507302403450012, "entropy": 0.07014501094818115, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:32:59.191045Z", "loop": 3432, "env_steps": 2109235199, "loss": 0.0012826028978452086, "avg_return": 0.45149263739585876, "regret": 0.3507302403450012, "entropy": 0.06615731865167618, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:00.352525Z", "loop": 3433, "env_steps": 2109849599, "loss": 0.0011902896221727133, "avg_return": 0.4480627179145813, "regret": 0.3507302403450012, "entropy": 0.06449128687381744, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:01.513663Z", "loop": 3434, "env_steps": 2110463999, "loss": 0.0009583791834302247, "avg_return": 0.45779532194137573, "regret": 0.3507302403450012, "entropy": 0.055663738399744034, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:02.675858Z", "loop": 3435, "env_steps": 2111078399, "loss": 0.000635908218100667, "avg_return": 0.45136791467666626, "regret": 0.3507302403450012, "entropy": 0.05625085160136223, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:03.836125Z", "loop": 3436, "env_steps": 2111692799, "loss": 0.000595333578530699, "avg_return": 0.4546242356300354, "regret": 0.3507302403450012, "entropy": 0.05734791234135628, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:04.997608Z", "loop": 3437, "env_steps": 2112307199, "loss": 0.0004802132025361061, "avg_return": 0.4566722810268402, "regret": 0.3507302403450012, "entropy": 0.056312888860702515, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:06.159461Z", "loop": 3438, "env_steps": 2112921599, "loss": 0.0006453351234085858, "avg_return": 0.4485238790512085, "regret": 0.3507302403450012, "entropy": 0.059497807174921036, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:07.322673Z", "loop": 3439, "env_steps": 2113535999, "loss": 0.0006997246528044343, "avg_return": 0.45222190022468567, "regret": 0.3507302403450012, "entropy": 0.057089053094387054, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:08.541091Z", "loop": 3440, "env_steps": 2114150399, "loss": 0.0006838533445261419, "avg_return": 0.4621468782424927, "regret": 0.35062533617019653, "entropy": 0.05896682292222977, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:09.701997Z", "loop": 3441, "env_steps": 2114764799, "loss": 0.000579421641305089, "avg_return": 0.45355236530303955, "regret": 0.35062533617019653, "entropy": 0.05774321034550667, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:10.863592Z", "loop": 3442, "env_steps": 2115379199, "loss": 0.0005500101251527667, "avg_return": 0.4497596323490143, "regret": 0.35062533617019653, "entropy": 0.06193547695875168, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:12.027247Z", "loop": 3443, "env_steps": 2115993599, "loss": 0.0005242086481302977, "avg_return": 0.45555350184440613, "regret": 0.35062533617019653, "entropy": 0.05710238590836525, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:13.191514Z", "loop": 3444, "env_steps": 2116607999, "loss": 0.0005012810579501092, "avg_return": 0.4557569622993469, "regret": 0.35062533617019653, "entropy": 0.05890750139951706, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:14.355210Z", "loop": 3445, "env_steps": 2117222399, "loss": 0.0005119580309838057, "avg_return": 0.45270779728889465, "regret": 0.35062533617019653, "entropy": 0.058276548981666565, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:15.516828Z", "loop": 3446, "env_steps": 2117836799, "loss": 0.0005578614654950798, "avg_return": 0.45685410499572754, "regret": 0.35062533617019653, "entropy": 0.059569891542196274, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:16.679880Z", "loop": 3447, "env_steps": 2118451199, "loss": 0.0005532358773052692, "avg_return": 0.45044007897377014, "regret": 0.35062533617019653, "entropy": 0.053859494626522064, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:17.843312Z", "loop": 3448, "env_steps": 2119065599, "loss": 0.0006230988074094057, "avg_return": 0.4580305218696594, "regret": 0.35062533617019653, "entropy": 0.05546354874968529, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:19.004735Z", "loop": 3449, "env_steps": 2119679999, "loss": 0.0004913550219498575, "avg_return": 0.4540867209434509, "regret": 0.35062533617019653, "entropy": 0.05553203821182251, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:20.218404Z", "loop": 3450, "env_steps": 2120294399, "loss": 0.0005846808198839426, "avg_return": 0.45275574922561646, "regret": 0.350638210773468, "entropy": 0.05253024399280548, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:21.381144Z", "loop": 3451, "env_steps": 2120908799, "loss": 0.0006288668373599648, "avg_return": 0.45875808596611023, "regret": 0.350638210773468, "entropy": 0.06002872809767723, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:22.544714Z", "loop": 3452, "env_steps": 2121523199, "loss": 0.0006098636658862233, "avg_return": 0.4470542371273041, "regret": 0.350638210773468, "entropy": 0.0579550676047802, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:23.706516Z", "loop": 3453, "env_steps": 2122137599, "loss": 0.0005655676359310746, "avg_return": 0.4509454071521759, "regret": 0.350638210773468, "entropy": 0.05544643849134445, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:24.868505Z", "loop": 3454, "env_steps": 2122751999, "loss": 0.0006455406546592712, "avg_return": 0.4548647105693817, "regret": 0.350638210773468, "entropy": 0.053913865238428116, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:26.030681Z", "loop": 3455, "env_steps": 2123366399, "loss": 0.0005414769984781742, "avg_return": 0.45021262764930725, "regret": 0.350638210773468, "entropy": 0.056667886674404144, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:27.192683Z", "loop": 3456, "env_steps": 2123980799, "loss": 0.0005886759608983994, "avg_return": 0.45102185010910034, "regret": 0.350638210773468, "entropy": 0.056042809039354324, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:28.356185Z", "loop": 3457, "env_steps": 2124595199, "loss": 0.0008759619668126106, "avg_return": 0.4639734923839569, "regret": 0.350638210773468, "entropy": 0.05607415363192558, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:29.517254Z", "loop": 3458, "env_steps": 2125209599, "loss": 0.0007681430433876812, "avg_return": 0.45464396476745605, "regret": 0.350638210773468, "entropy": 0.06294780969619751, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:30.678780Z", "loop": 3459, "env_steps": 2125823999, "loss": 0.0006926350179128349, "avg_return": 0.45013368129730225, "regret": 0.350638210773468, "entropy": 0.0560309924185276, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:31.887476Z", "loop": 3460, "env_steps": 2126438399, "loss": 0.0006849461933597922, "avg_return": 0.45639610290527344, "regret": 0.3506482243537903, "entropy": 0.051248639822006226, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:33.048502Z", "loop": 3461, "env_steps": 2127052799, "loss": 0.0007798405713401735, "avg_return": 0.45278340578079224, "regret": 0.3506482243537903, "entropy": 0.05426209792494774, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:34.211703Z", "loop": 3462, "env_steps": 2127667199, "loss": 0.0006532957195304334, "avg_return": 0.44860678911209106, "regret": 0.3506482243537903, "entropy": 0.0580885149538517, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:35.371936Z", "loop": 3463, "env_steps": 2128281599, "loss": 0.0007332732202485204, "avg_return": 0.45772916078567505, "regret": 0.3506482243537903, "entropy": 0.0583866611123085, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:36.534047Z", "loop": 3464, "env_steps": 2128895999, "loss": 0.0006623363588005304, "avg_return": 0.45842602849006653, "regret": 0.3506482243537903, "entropy": 0.055082641541957855, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:37.695537Z", "loop": 3465, "env_steps": 2129510399, "loss": 0.0010320296278223395, "avg_return": 0.45088991522789, "regret": 0.3506482243537903, "entropy": 0.05983676388859749, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:38.860001Z", "loop": 3466, "env_steps": 2130124799, "loss": 0.0011081701377406716, "avg_return": 0.45690008997917175, "regret": 0.3506482243537903, "entropy": 0.060627054423093796, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:40.021555Z", "loop": 3467, "env_steps": 2130739199, "loss": 0.0011062490520998836, "avg_return": 0.45306897163391113, "regret": 0.3506482243537903, "entropy": 0.0636088103055954, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:41.182500Z", "loop": 3468, "env_steps": 2131353599, "loss": 0.0012313410406932235, "avg_return": 0.4507330060005188, "regret": 0.3506482243537903, "entropy": 0.06470949947834015, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:42.344777Z", "loop": 3469, "env_steps": 2131967999, "loss": 0.0012672458542510867, "avg_return": 0.44810640811920166, "regret": 0.3506482243537903, "entropy": 0.06542154401540756, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:43.559368Z", "loop": 3470, "env_steps": 2132582399, "loss": 0.0011305772932246327, "avg_return": 0.4543139338493347, "regret": 0.35070133209228516, "entropy": 0.06439895927906036, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:44.725593Z", "loop": 3471, "env_steps": 2133196799, "loss": 0.0011507170274853706, "avg_return": 0.45603853464126587, "regret": 0.35070133209228516, "entropy": 0.06566682457923889, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:45.886263Z", "loop": 3472, "env_steps": 2133811199, "loss": 0.000771589984651655, "avg_return": 0.458173543214798, "regret": 0.35070133209228516, "entropy": 0.05879763886332512, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:47.047991Z", "loop": 3473, "env_steps": 2134425599, "loss": 0.0006513852276839316, "avg_return": 0.4565868377685547, "regret": 0.35070133209228516, "entropy": 0.05637863650918007, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:48.210006Z", "loop": 3474, "env_steps": 2135039999, "loss": 0.0005086538731120527, "avg_return": 0.4556259214878082, "regret": 0.35070133209228516, "entropy": 0.06042156368494034, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:49.372721Z", "loop": 3475, "env_steps": 2135654399, "loss": 0.00032209217897616327, "avg_return": 0.4535152316093445, "regret": 0.35070133209228516, "entropy": 0.05492516607046127, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:50.535657Z", "loop": 3476, "env_steps": 2136268799, "loss": 0.0004342047614045441, "avg_return": 0.4604351818561554, "regret": 0.35070133209228516, "entropy": 0.056313157081604004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:51.698922Z", "loop": 3477, "env_steps": 2136883199, "loss": 0.00044367212103679776, "avg_return": 0.45417195558547974, "regret": 0.35070133209228516, "entropy": 0.05015508085489273, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:52.860194Z", "loop": 3478, "env_steps": 2137497599, "loss": 0.0005577268893830478, "avg_return": 0.45037198066711426, "regret": 0.35070133209228516, "entropy": 0.05375618487596512, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:54.022320Z", "loop": 3479, "env_steps": 2138111999, "loss": 0.0005576236872002482, "avg_return": 0.4498937726020813, "regret": 0.35070133209228516, "entropy": 0.059398114681243896, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:55.231010Z", "loop": 3480, "env_steps": 2138726399, "loss": 0.0006688518915325403, "avg_return": 0.45511430501937866, "regret": 0.3505755066871643, "entropy": 0.060566771775484085, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:56.392931Z", "loop": 3481, "env_steps": 2139340799, "loss": 0.0009626300306990743, "avg_return": 0.4514583349227905, "regret": 0.3505755066871643, "entropy": 0.05642998591065407, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:57.554289Z", "loop": 3482, "env_steps": 2139955199, "loss": 0.0008543715812265873, "avg_return": 0.4517991244792938, "regret": 0.3505755066871643, "entropy": 0.06496315449476242, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:58.715777Z", "loop": 3483, "env_steps": 2140569599, "loss": 0.0014453997137024999, "avg_return": 0.4567657709121704, "regret": 0.3505755066871643, "entropy": 0.06849926710128784, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:33:59.876236Z", "loop": 3484, "env_steps": 2141183999, "loss": 0.0016754083335399628, "avg_return": 0.4583103656768799, "regret": 0.3505755066871643, "entropy": 0.06929904967546463, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:01.037529Z", "loop": 3485, "env_steps": 2141798399, "loss": 0.0018975958228111267, "avg_return": 0.4559883177280426, "regret": 0.3505755066871643, "entropy": 0.0684514194726944, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:02.197858Z", "loop": 3486, "env_steps": 2142412799, "loss": 0.001616092980839312, "avg_return": 0.4506947994232178, "regret": 0.3505755066871643, "entropy": 0.06763045489788055, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:03.358358Z", "loop": 3487, "env_steps": 2143027199, "loss": 0.00179202388972044, "avg_return": 0.4505154490470886, "regret": 0.3505755066871643, "entropy": 0.06880505383014679, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:04.519572Z", "loop": 3488, "env_steps": 2143641599, "loss": 0.0015270182630047202, "avg_return": 0.45512568950653076, "regret": 0.3505755066871643, "entropy": 0.06553959101438522, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:05.680431Z", "loop": 3489, "env_steps": 2144255999, "loss": 0.0014960098778828979, "avg_return": 0.4500678479671478, "regret": 0.3505755066871643, "entropy": 0.0700179934501648, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:06.886155Z", "loop": 3490, "env_steps": 2144870399, "loss": 0.0016476825112476945, "avg_return": 0.45911428332328796, "regret": 0.3506561815738678, "entropy": 0.0656626969575882, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:08.047581Z", "loop": 3491, "env_steps": 2145484799, "loss": 0.0016272178618237376, "avg_return": 0.4521598815917969, "regret": 0.3506561815738678, "entropy": 0.07365136593580246, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:09.209494Z", "loop": 3492, "env_steps": 2146099199, "loss": 0.001747813425026834, "avg_return": 0.4609542489051819, "regret": 0.3506561815738678, "entropy": 0.07042636722326279, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:10.370333Z", "loop": 3493, "env_steps": 2146713599, "loss": 0.001684881397522986, "avg_return": 0.46085649728775024, "regret": 0.3506561815738678, "entropy": 0.06739666312932968, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:11.532241Z", "loop": 3494, "env_steps": 2147327999, "loss": 0.0013007641537114978, "avg_return": 0.4487646520137787, "regret": 0.3506561815738678, "entropy": 0.06894011795520782, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:12.692562Z", "loop": 3495, "env_steps": 2147942399, "loss": 0.001575421541929245, "avg_return": 0.45225366950035095, "regret": 0.3506561815738678, "entropy": 0.06494147330522537, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:13.852956Z", "loop": 3496, "env_steps": 2148556799, "loss": 0.001479838858358562, "avg_return": 0.44813621044158936, "regret": 0.3506561815738678, "entropy": 0.07024899125099182, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:15.014221Z", "loop": 3497, "env_steps": 2149171199, "loss": 0.0017492184415459633, "avg_return": 0.45789897441864014, "regret": 0.3506561815738678, "entropy": 0.06782299280166626, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:16.174666Z", "loop": 3498, "env_steps": 2149785599, "loss": 0.002213152125477791, "avg_return": 0.4546048641204834, "regret": 0.3506561815738678, "entropy": 0.06836408376693726, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:17.336397Z", "loop": 3499, "env_steps": 2150399999, "loss": 0.0024523758329451084, "avg_return": 0.45703965425491333, "regret": 0.3506561815738678, "entropy": 0.06791061162948608, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:18.548928Z", "loop": 3500, "env_steps": 2151014399, "loss": 0.0022829046938568354, "avg_return": 0.45193207263946533, "regret": 0.3514961302280426, "entropy": 0.06276582926511765, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:19.710528Z", "loop": 3501, "env_steps": 2151628799, "loss": 0.002295249840244651, "avg_return": 0.45375093817710876, "regret": 0.3514961302280426, "entropy": 0.06098197400569916, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:20.871097Z", "loop": 3502, "env_steps": 2152243199, "loss": 0.0020252587273716927, "avg_return": 0.4533441662788391, "regret": 0.3514961302280426, "entropy": 0.06161060556769371, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:22.032466Z", "loop": 3503, "env_steps": 2152857599, "loss": 0.0021547763608396053, "avg_return": 0.44864320755004883, "regret": 0.3514961302280426, "entropy": 0.06220855191349983, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:23.194254Z", "loop": 3504, "env_steps": 2153471999, "loss": 0.0021270362194627523, "avg_return": 0.45280539989471436, "regret": 0.3514961302280426, "entropy": 0.05761834233999252, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:24.355402Z", "loop": 3505, "env_steps": 2154086399, "loss": 0.001988531555980444, "avg_return": 0.45452260971069336, "regret": 0.3514961302280426, "entropy": 0.05322740972042084, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:25.516944Z", "loop": 3506, "env_steps": 2154700799, "loss": 0.0016209654277190566, "avg_return": 0.45839861035346985, "regret": 0.3514961302280426, "entropy": 0.055954691022634506, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:26.677565Z", "loop": 3507, "env_steps": 2155315199, "loss": 0.0015654087765142322, "avg_return": 0.4517500400543213, "regret": 0.3514961302280426, "entropy": 0.0509362667798996, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:27.838886Z", "loop": 3508, "env_steps": 2155929599, "loss": 0.0012997603043913841, "avg_return": 0.4568536579608917, "regret": 0.3514961302280426, "entropy": 0.05012792348861694, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:28.999024Z", "loop": 3509, "env_steps": 2156543999, "loss": 0.0011553127551451325, "avg_return": 0.4583306610584259, "regret": 0.3514961302280426, "entropy": 0.04745003581047058, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:30.207964Z", "loop": 3510, "env_steps": 2157158399, "loss": 0.0011055483482778072, "avg_return": 0.45237183570861816, "regret": 0.3507862985134125, "entropy": 0.0480545237660408, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:31.369098Z", "loop": 3511, "env_steps": 2157772799, "loss": 0.0011721760965883732, "avg_return": 0.45738425850868225, "regret": 0.3507862985134125, "entropy": 0.049044061452150345, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:32.530156Z", "loop": 3512, "env_steps": 2158387199, "loss": 0.0012600355548784137, "avg_return": 0.45632457733154297, "regret": 0.3507862985134125, "entropy": 0.049245718866586685, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:33.691206Z", "loop": 3513, "env_steps": 2159001599, "loss": 0.0011685866629704833, "avg_return": 0.4526742100715637, "regret": 0.3507862985134125, "entropy": 0.04746915400028229, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:34.851542Z", "loop": 3514, "env_steps": 2159615999, "loss": 0.0011054964270442724, "avg_return": 0.45928528904914856, "regret": 0.3507862985134125, "entropy": 0.04737250134348869, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:36.012774Z", "loop": 3515, "env_steps": 2160230399, "loss": 0.0010070637799799442, "avg_return": 0.44338706135749817, "regret": 0.3507862985134125, "entropy": 0.048537302762269974, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:37.173088Z", "loop": 3516, "env_steps": 2160844799, "loss": 0.0014215687988325953, "avg_return": 0.4543646275997162, "regret": 0.3507862985134125, "entropy": 0.04867086187005043, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:38.333817Z", "loop": 3517, "env_steps": 2161459199, "loss": 0.0015565865905955434, "avg_return": 0.45686790347099304, "regret": 0.3507862985134125, "entropy": 0.051482830196619034, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:39.493762Z", "loop": 3518, "env_steps": 2162073599, "loss": 0.0014615508262068033, "avg_return": 0.4412330687046051, "regret": 0.3507862985134125, "entropy": 0.05494071543216705, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:40.654336Z", "loop": 3519, "env_steps": 2162687999, "loss": 0.001705390983261168, "avg_return": 0.4560261070728302, "regret": 0.3507862985134125, "entropy": 0.05313252657651901, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:41.874208Z", "loop": 3520, "env_steps": 2163302399, "loss": 0.0016110735014081001, "avg_return": 0.45138266682624817, "regret": 0.3511996567249298, "entropy": 0.05344152823090553, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:43.035924Z", "loop": 3521, "env_steps": 2163916799, "loss": 0.001777272904291749, "avg_return": 0.45246604084968567, "regret": 0.3511996567249298, "entropy": 0.054651889950037, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:44.198157Z", "loop": 3522, "env_steps": 2164531199, "loss": 0.0018631259445101023, "avg_return": 0.44858765602111816, "regret": 0.3511996567249298, "entropy": 0.059961605817079544, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:45.358755Z", "loop": 3523, "env_steps": 2165145599, "loss": 0.0023706138599663973, "avg_return": 0.4503776729106903, "regret": 0.3511996567249298, "entropy": 0.07093209773302078, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:46.520196Z", "loop": 3524, "env_steps": 2165759999, "loss": 0.0026540523394942284, "avg_return": 0.451668918132782, "regret": 0.3511996567249298, "entropy": 0.0709594264626503, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:47.682183Z", "loop": 3525, "env_steps": 2166374399, "loss": 0.002732137218117714, "avg_return": 0.44940897822380066, "regret": 0.3511996567249298, "entropy": 0.06929206848144531, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:48.842700Z", "loop": 3526, "env_steps": 2166988799, "loss": 0.0028322848957031965, "avg_return": 0.4537017047405243, "regret": 0.3511996567249298, "entropy": 0.0711631029844284, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:50.004286Z", "loop": 3527, "env_steps": 2167603199, "loss": 0.0026412277948111296, "avg_return": 0.4538475573062897, "regret": 0.3511996567249298, "entropy": 0.06693572551012039, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:51.165513Z", "loop": 3528, "env_steps": 2168217599, "loss": 0.0029962381813675165, "avg_return": 0.4516313672065735, "regret": 0.3511996567249298, "entropy": 0.07296890020370483, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:52.330079Z", "loop": 3529, "env_steps": 2168831999, "loss": 0.002780724549666047, "avg_return": 0.44847503304481506, "regret": 0.3511996567249298, "entropy": 0.07149601727724075, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:53.537285Z", "loop": 3530, "env_steps": 2169446399, "loss": 0.002753708278760314, "avg_return": 0.45065680146217346, "regret": 0.35126200318336487, "entropy": 0.07213564962148666, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:54.699146Z", "loop": 3531, "env_steps": 2170060799, "loss": 0.0030125256162136793, "avg_return": 0.4499245285987854, "regret": 0.35126200318336487, "entropy": 0.07520680874586105, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:55.860629Z", "loop": 3532, "env_steps": 2170675199, "loss": 0.0029705914203077555, "avg_return": 0.4562642574310303, "regret": 0.35126200318336487, "entropy": 0.07296236604452133, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:57.023981Z", "loop": 3533, "env_steps": 2171289599, "loss": 0.0026086883153766394, "avg_return": 0.455920934677124, "regret": 0.35126200318336487, "entropy": 0.06672711670398712, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:58.188318Z", "loop": 3534, "env_steps": 2171903999, "loss": 0.0023895164486020803, "avg_return": 0.4630524814128876, "regret": 0.35126200318336487, "entropy": 0.06252497434616089, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:34:59.349845Z", "loop": 3535, "env_steps": 2172518399, "loss": 0.0026561939157545567, "avg_return": 0.4531917870044708, "regret": 0.35126200318336487, "entropy": 0.06797558814287186, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:00.511535Z", "loop": 3536, "env_steps": 2173132799, "loss": 0.0024140949826687574, "avg_return": 0.45139917731285095, "regret": 0.35126200318336487, "entropy": 0.06778866797685623, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:01.672964Z", "loop": 3537, "env_steps": 2173747199, "loss": 0.0023722087498754263, "avg_return": 0.4478019177913666, "regret": 0.35126200318336487, "entropy": 0.05737955868244171, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:02.836326Z", "loop": 3538, "env_steps": 2174361599, "loss": 0.0019970580469816923, "avg_return": 0.44757142663002014, "regret": 0.35126200318336487, "entropy": 0.05791664868593216, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:03.998861Z", "loop": 3539, "env_steps": 2174975999, "loss": 0.0019543147645890713, "avg_return": 0.4483209252357483, "regret": 0.35126200318336487, "entropy": 0.05621885508298874, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:05.208107Z", "loop": 3540, "env_steps": 2175590399, "loss": 0.001917094923555851, "avg_return": 0.453399658203125, "regret": 0.35168448090553284, "entropy": 0.05628402531147003, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:06.370137Z", "loop": 3541, "env_steps": 2176204799, "loss": 0.0020312522538006306, "avg_return": 0.46103495359420776, "regret": 0.35168448090553284, "entropy": 0.055382613092660904, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:07.531713Z", "loop": 3542, "env_steps": 2176819199, "loss": 0.00176400993950665, "avg_return": 0.4519941210746765, "regret": 0.35168448090553284, "entropy": 0.051098451018333435, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:08.694235Z", "loop": 3543, "env_steps": 2177433599, "loss": 0.0020826735999435186, "avg_return": 0.4576815962791443, "regret": 0.35168448090553284, "entropy": 0.05786380544304848, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:09.855878Z", "loop": 3544, "env_steps": 2178047999, "loss": 0.0018952075624838471, "avg_return": 0.4466153085231781, "regret": 0.35168448090553284, "entropy": 0.05861737206578255, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:11.017257Z", "loop": 3545, "env_steps": 2178662399, "loss": 0.0018304598052054644, "avg_return": 0.4585517942905426, "regret": 0.35168448090553284, "entropy": 0.055046338587999344, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:12.179456Z", "loop": 3546, "env_steps": 2179276799, "loss": 0.0024648706894367933, "avg_return": 0.45727142691612244, "regret": 0.35168448090553284, "entropy": 0.06008390337228775, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:13.341317Z", "loop": 3547, "env_steps": 2179891199, "loss": 0.002375755226239562, "avg_return": 0.45410147309303284, "regret": 0.35168448090553284, "entropy": 0.06555405259132385, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:14.502664Z", "loop": 3548, "env_steps": 2180505599, "loss": 0.0026624235324561596, "avg_return": 0.4445381164550781, "regret": 0.35168448090553284, "entropy": 0.06629034876823425, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:15.662775Z", "loop": 3549, "env_steps": 2181119999, "loss": 0.0025217579677700996, "avg_return": 0.44735896587371826, "regret": 0.35168448090553284, "entropy": 0.06763139367103577, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:16.869351Z", "loop": 3550, "env_steps": 2181734399, "loss": 0.002753627486526966, "avg_return": 0.4545719027519226, "regret": 0.3507933020591736, "entropy": 0.06465750932693481, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:18.030932Z", "loop": 3551, "env_steps": 2182348799, "loss": 0.0026068154256790876, "avg_return": 0.44911307096481323, "regret": 0.3507933020591736, "entropy": 0.06202485039830208, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:19.193348Z", "loop": 3552, "env_steps": 2182963199, "loss": 0.0021803162526339293, "avg_return": 0.4500686824321747, "regret": 0.3507933020591736, "entropy": 0.059716735035181046, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:20.353816Z", "loop": 3553, "env_steps": 2183577599, "loss": 0.002156967995688319, "avg_return": 0.44992727041244507, "regret": 0.3507933020591736, "entropy": 0.05737007036805153, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:21.515472Z", "loop": 3554, "env_steps": 2184191999, "loss": 0.0023361907806247473, "avg_return": 0.4530947506427765, "regret": 0.3507933020591736, "entropy": 0.06048603355884552, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:22.677549Z", "loop": 3555, "env_steps": 2184806399, "loss": 0.002157617826014757, "avg_return": 0.44944876432418823, "regret": 0.3507933020591736, "entropy": 0.05974610149860382, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:23.839508Z", "loop": 3556, "env_steps": 2185420799, "loss": 0.0017707828665152192, "avg_return": 0.45096275210380554, "regret": 0.3507933020591736, "entropy": 0.05166224017739296, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:25.001381Z", "loop": 3557, "env_steps": 2186035199, "loss": 0.0014095727819949389, "avg_return": 0.4520678222179413, "regret": 0.3507933020591736, "entropy": 0.04643309488892555, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:26.161625Z", "loop": 3558, "env_steps": 2186649599, "loss": 0.0012336265062913299, "avg_return": 0.4539327621459961, "regret": 0.3507933020591736, "entropy": 0.04566511511802673, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:27.324207Z", "loop": 3559, "env_steps": 2187263999, "loss": 0.0010941647924482822, "avg_return": 0.46065354347229004, "regret": 0.3507933020591736, "entropy": 0.04513604938983917, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:28.531188Z", "loop": 3560, "env_steps": 2187878399, "loss": 0.0009978736052289605, "avg_return": 0.4548364281654358, "regret": 0.35091114044189453, "entropy": 0.04279697313904762, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:29.694967Z", "loop": 3561, "env_steps": 2188492799, "loss": 0.0010565562406554818, "avg_return": 0.44616490602493286, "regret": 0.35091114044189453, "entropy": 0.041064828634262085, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:30.855385Z", "loop": 3562, "env_steps": 2189107199, "loss": 0.0009870670037344098, "avg_return": 0.45323893427848816, "regret": 0.35091114044189453, "entropy": 0.041937991976737976, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:32.017178Z", "loop": 3563, "env_steps": 2189721599, "loss": 0.0009909708751365542, "avg_return": 0.44928255677223206, "regret": 0.35091114044189453, "entropy": 0.042139507830142975, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:33.181068Z", "loop": 3564, "env_steps": 2190335999, "loss": 0.0009570760885253549, "avg_return": 0.44918274879455566, "regret": 0.35091114044189453, "entropy": 0.04014645144343376, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:34.343155Z", "loop": 3565, "env_steps": 2190950399, "loss": 0.0009337224182672799, "avg_return": 0.4499160945415497, "regret": 0.35091114044189453, "entropy": 0.041898202151060104, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:35.504457Z", "loop": 3566, "env_steps": 2191564799, "loss": 0.0009130900725722313, "avg_return": 0.45037803053855896, "regret": 0.35091114044189453, "entropy": 0.04164232686161995, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:36.665929Z", "loop": 3567, "env_steps": 2192179199, "loss": 0.000905303459148854, "avg_return": 0.4571099877357483, "regret": 0.35091114044189453, "entropy": 0.039654530584812164, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:37.827060Z", "loop": 3568, "env_steps": 2192793599, "loss": 0.0009510198724456131, "avg_return": 0.4529957175254822, "regret": 0.35091114044189453, "entropy": 0.04419590160250664, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:38.990660Z", "loop": 3569, "env_steps": 2193407999, "loss": 0.001094795181415975, "avg_return": 0.4532988667488098, "regret": 0.35091114044189453, "entropy": 0.043016467243433, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:40.199379Z", "loop": 3570, "env_steps": 2194022399, "loss": 0.001073045190423727, "avg_return": 0.4555882513523102, "regret": 0.35071390867233276, "entropy": 0.046434517949819565, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:41.360444Z", "loop": 3571, "env_steps": 2194636799, "loss": 0.0009767931187525392, "avg_return": 0.4601615369319916, "regret": 0.35071390867233276, "entropy": 0.04284575581550598, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:42.522368Z", "loop": 3572, "env_steps": 2195251199, "loss": 0.0009670564904808998, "avg_return": 0.4520858824253082, "regret": 0.35071390867233276, "entropy": 0.04454365745186806, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:43.684150Z", "loop": 3573, "env_steps": 2195865599, "loss": 0.0011155485408380628, "avg_return": 0.45399385690689087, "regret": 0.35071390867233276, "entropy": 0.04103376343846321, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:44.844921Z", "loop": 3574, "env_steps": 2196479999, "loss": 0.001047165016643703, "avg_return": 0.45634162425994873, "regret": 0.35071390867233276, "entropy": 0.04514202103018761, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:46.007260Z", "loop": 3575, "env_steps": 2197094399, "loss": 0.0010848308447748423, "avg_return": 0.45358309149742126, "regret": 0.35071390867233276, "entropy": 0.042368173599243164, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:47.169364Z", "loop": 3576, "env_steps": 2197708799, "loss": 0.0010058425832539797, "avg_return": 0.45203152298927307, "regret": 0.35071390867233276, "entropy": 0.04212909936904907, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:48.330191Z", "loop": 3577, "env_steps": 2198323199, "loss": 0.001054231426678598, "avg_return": 0.4468235373497009, "regret": 0.35071390867233276, "entropy": 0.043143294751644135, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:49.491863Z", "loop": 3578, "env_steps": 2198937599, "loss": 0.000980022712610662, "avg_return": 0.4509351849555969, "regret": 0.35071390867233276, "entropy": 0.04059219732880592, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:50.653007Z", "loop": 3579, "env_steps": 2199551999, "loss": 0.0011152372462674975, "avg_return": 0.4516518712043762, "regret": 0.35071390867233276, "entropy": 0.04107879102230072, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:51.860410Z", "loop": 3580, "env_steps": 2200166399, "loss": 0.0011889853049069643, "avg_return": 0.4481751620769501, "regret": 0.350660502910614, "entropy": 0.04349557310342789, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:53.022773Z", "loop": 3581, "env_steps": 2200780799, "loss": 0.001100148307159543, "avg_return": 0.4511503279209137, "regret": 0.350660502910614, "entropy": 0.03833237662911415, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:54.184529Z", "loop": 3582, "env_steps": 2201395199, "loss": 0.0011437436332926154, "avg_return": 0.448648601770401, "regret": 0.350660502910614, "entropy": 0.03928180783987045, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:55.345234Z", "loop": 3583, "env_steps": 2202009599, "loss": 0.0010536391055211425, "avg_return": 0.44938167929649353, "regret": 0.350660502910614, "entropy": 0.04458928853273392, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:56.507822Z", "loop": 3584, "env_steps": 2202623999, "loss": 0.000974799448158592, "avg_return": 0.4488339424133301, "regret": 0.350660502910614, "entropy": 0.042857516556978226, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:57.670069Z", "loop": 3585, "env_steps": 2203238399, "loss": 0.0009060082957148552, "avg_return": 0.4471990168094635, "regret": 0.350660502910614, "entropy": 0.04329046607017517, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:58.831151Z", "loop": 3586, "env_steps": 2203852799, "loss": 0.0010881638154387474, "avg_return": 0.45586898922920227, "regret": 0.350660502910614, "entropy": 0.040886811912059784, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:35:59.992938Z", "loop": 3587, "env_steps": 2204467199, "loss": 0.0010512308217585087, "avg_return": 0.4468916356563568, "regret": 0.350660502910614, "entropy": 0.0468703918159008, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:01.153099Z", "loop": 3588, "env_steps": 2205081599, "loss": 0.0008960647392086685, "avg_return": 0.45693501830101013, "regret": 0.350660502910614, "entropy": 0.04021747410297394, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:02.314588Z", "loop": 3589, "env_steps": 2205695999, "loss": 0.0009824897861108184, "avg_return": 0.45762568712234497, "regret": 0.350660502910614, "entropy": 0.03917191922664642, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:03.520243Z", "loop": 3590, "env_steps": 2206310399, "loss": 0.0009853658266365528, "avg_return": 0.4521847665309906, "regret": 0.35070574283599854, "entropy": 0.04605532065033913, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:04.681813Z", "loop": 3591, "env_steps": 2206924799, "loss": 0.00108049635309726, "avg_return": 0.44766226410865784, "regret": 0.35070574283599854, "entropy": 0.044758763164281845, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:05.842459Z", "loop": 3592, "env_steps": 2207539199, "loss": 0.0008846269338391721, "avg_return": 0.44739624857902527, "regret": 0.35070574283599854, "entropy": 0.03901231661438942, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:07.003842Z", "loop": 3593, "env_steps": 2208153599, "loss": 0.0010244314325973392, "avg_return": 0.4527617394924164, "regret": 0.35070574283599854, "entropy": 0.04255286976695061, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:08.165069Z", "loop": 3594, "env_steps": 2208767999, "loss": 0.001057146000675857, "avg_return": 0.45617690682411194, "regret": 0.35070574283599854, "entropy": 0.04386298358440399, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:09.325084Z", "loop": 3595, "env_steps": 2209382399, "loss": 0.001064507057890296, "avg_return": 0.44445115327835083, "regret": 0.35070574283599854, "entropy": 0.044444695115089417, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:10.486774Z", "loop": 3596, "env_steps": 2209996799, "loss": 0.0012921082088723779, "avg_return": 0.4525957405567169, "regret": 0.35070574283599854, "entropy": 0.0454404391348362, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:11.647114Z", "loop": 3597, "env_steps": 2210611199, "loss": 0.0013229540782049298, "avg_return": 0.4484768807888031, "regret": 0.35070574283599854, "entropy": 0.04779651015996933, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:12.808674Z", "loop": 3598, "env_steps": 2211225599, "loss": 0.0013843164779245853, "avg_return": 0.44973501563072205, "regret": 0.35070574283599854, "entropy": 0.04711470752954483, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:13.969514Z", "loop": 3599, "env_steps": 2211839999, "loss": 0.0015219838824123144, "avg_return": 0.4559236764907837, "regret": 0.35070574283599854, "entropy": 0.050345201045274734, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:15.175926Z", "loop": 3600, "env_steps": 2212454399, "loss": 0.0016427779337391257, "avg_return": 0.45621034502983093, "regret": 0.3506304919719696, "entropy": 0.04743972048163414, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:16.339924Z", "loop": 3601, "env_steps": 2213068799, "loss": 0.0014744214713573456, "avg_return": 0.45649653673171997, "regret": 0.3506304919719696, "entropy": 0.049027033150196075, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:17.501051Z", "loop": 3602, "env_steps": 2213683199, "loss": 0.0013009262038394809, "avg_return": 0.4558694660663605, "regret": 0.3506304919719696, "entropy": 0.04551974684000015, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:18.662637Z", "loop": 3603, "env_steps": 2214297599, "loss": 0.0013509202981367707, "avg_return": 0.4559529721736908, "regret": 0.3506304919719696, "entropy": 0.0435599721968174, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:19.823770Z", "loop": 3604, "env_steps": 2214911999, "loss": 0.0014594270614907146, "avg_return": 0.45093420147895813, "regret": 0.3506304919719696, "entropy": 0.045327078551054, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:20.986313Z", "loop": 3605, "env_steps": 2215526399, "loss": 0.001398220076225698, "avg_return": 0.44970959424972534, "regret": 0.3506304919719696, "entropy": 0.04472337290644646, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:22.147936Z", "loop": 3606, "env_steps": 2216140799, "loss": 0.0011058920063078403, "avg_return": 0.45485591888427734, "regret": 0.3506304919719696, "entropy": 0.043322984129190445, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:23.309046Z", "loop": 3607, "env_steps": 2216755199, "loss": 0.0011078236857429147, "avg_return": 0.45530712604522705, "regret": 0.3506304919719696, "entropy": 0.042483851313591, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:24.470455Z", "loop": 3608, "env_steps": 2217369599, "loss": 0.001067166100256145, "avg_return": 0.45402228832244873, "regret": 0.3506304919719696, "entropy": 0.045755185186862946, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:25.632887Z", "loop": 3609, "env_steps": 2217983999, "loss": 0.0009974940912798047, "avg_return": 0.4526720941066742, "regret": 0.3506304919719696, "entropy": 0.04315698519349098, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:26.850547Z", "loop": 3610, "env_steps": 2218598399, "loss": 0.001012770226225257, "avg_return": 0.4486266076564789, "regret": 0.3506794273853302, "entropy": 0.043794360011816025, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:28.012789Z", "loop": 3611, "env_steps": 2219212799, "loss": 0.0011768126860260963, "avg_return": 0.4575493335723877, "regret": 0.3506794273853302, "entropy": 0.04520002380013466, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:29.175783Z", "loop": 3612, "env_steps": 2219827199, "loss": 0.001213240553624928, "avg_return": 0.4539670944213867, "regret": 0.3506794273853302, "entropy": 0.04630156606435776, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:30.337228Z", "loop": 3613, "env_steps": 2220441599, "loss": 0.0013930503046140075, "avg_return": 0.46106234192848206, "regret": 0.3506794273853302, "entropy": 0.04614480584859848, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:31.499289Z", "loop": 3614, "env_steps": 2221055999, "loss": 0.0019825014751404524, "avg_return": 0.45313140749931335, "regret": 0.3506794273853302, "entropy": 0.054936181753873825, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:32.662455Z", "loop": 3615, "env_steps": 2221670399, "loss": 0.002173888962715864, "avg_return": 0.45405900478363037, "regret": 0.3506794273853302, "entropy": 0.057554177939891815, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:33.823910Z", "loop": 3616, "env_steps": 2222284799, "loss": 0.0023414308670908213, "avg_return": 0.45093679428100586, "regret": 0.3506794273853302, "entropy": 0.061374813318252563, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:34.985904Z", "loop": 3617, "env_steps": 2222899199, "loss": 0.002399688120931387, "avg_return": 0.4451069235801697, "regret": 0.3506794273853302, "entropy": 0.05829722434282303, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:36.147401Z", "loop": 3618, "env_steps": 2223513599, "loss": 0.002412369940429926, "avg_return": 0.45103782415390015, "regret": 0.3506794273853302, "entropy": 0.06132977455854416, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:37.310147Z", "loop": 3619, "env_steps": 2224127999, "loss": 0.0025889643002301455, "avg_return": 0.45182475447654724, "regret": 0.3506794273853302, "entropy": 0.060530904680490494, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:38.524671Z", "loop": 3620, "env_steps": 2224742399, "loss": 0.0020678408909589052, "avg_return": 0.44719311594963074, "regret": 0.35571378469467163, "entropy": 0.054469071328639984, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:39.685383Z", "loop": 3621, "env_steps": 2225356799, "loss": 0.00232107425108552, "avg_return": 0.44602203369140625, "regret": 0.35571378469467163, "entropy": 0.05575966835021973, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:40.847171Z", "loop": 3622, "env_steps": 2225971199, "loss": 0.0022097143810242414, "avg_return": 0.446509450674057, "regret": 0.35571378469467163, "entropy": 0.056678831577301025, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:42.007857Z", "loop": 3623, "env_steps": 2226585599, "loss": 0.002205333672463894, "avg_return": 0.4453442394733429, "regret": 0.35571378469467163, "entropy": 0.0569688118994236, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:43.169495Z", "loop": 3624, "env_steps": 2227199999, "loss": 0.002062282059341669, "avg_return": 0.44333404302597046, "regret": 0.35571378469467163, "entropy": 0.0563289113342762, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:44.330327Z", "loop": 3625, "env_steps": 2227814399, "loss": 0.0021421555429697037, "avg_return": 0.4459174573421478, "regret": 0.35571378469467163, "entropy": 0.05481216683983803, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:45.491996Z", "loop": 3626, "env_steps": 2228428799, "loss": 0.0024288531858474016, "avg_return": 0.450957715511322, "regret": 0.35571378469467163, "entropy": 0.057133596390485764, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:46.653711Z", "loop": 3627, "env_steps": 2229043199, "loss": 0.0023212109226733446, "avg_return": 0.4505080282688141, "regret": 0.35571378469467163, "entropy": 0.058681610971689224, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:47.815800Z", "loop": 3628, "env_steps": 2229657599, "loss": 0.0024583509657531977, "avg_return": 0.4538201093673706, "regret": 0.35571378469467163, "entropy": 0.060691121965646744, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:48.978039Z", "loop": 3629, "env_steps": 2230271999, "loss": 0.002401382429525256, "avg_return": 0.44399920105934143, "regret": 0.35571378469467163, "entropy": 0.05983417481184006, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:50.183455Z", "loop": 3630, "env_steps": 2230886399, "loss": 0.0025782508309930563, "avg_return": 0.4518962800502777, "regret": 0.3522098660469055, "entropy": 0.06430105865001678, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:51.345053Z", "loop": 3631, "env_steps": 2231500799, "loss": 0.0023982941638678312, "avg_return": 0.4535461664199829, "regret": 0.3522098660469055, "entropy": 0.06257306784391403, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:52.505840Z", "loop": 3632, "env_steps": 2232115199, "loss": 0.0022055609151721, "avg_return": 0.44263872504234314, "regret": 0.3522098660469055, "entropy": 0.06136085093021393, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:53.670441Z", "loop": 3633, "env_steps": 2232729599, "loss": 0.002286473521962762, "avg_return": 0.4545314610004425, "regret": 0.3522098660469055, "entropy": 0.057587411254644394, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:54.831193Z", "loop": 3634, "env_steps": 2233343999, "loss": 0.0020418178755789995, "avg_return": 0.4590221345424652, "regret": 0.3522098660469055, "entropy": 0.05622505024075508, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:55.992106Z", "loop": 3635, "env_steps": 2233958399, "loss": 0.0019297061953693628, "avg_return": 0.4503383934497833, "regret": 0.3522098660469055, "entropy": 0.0540589801967144, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:57.155376Z", "loop": 3636, "env_steps": 2234572799, "loss": 0.0016652418999001384, "avg_return": 0.4533819556236267, "regret": 0.3522098660469055, "entropy": 0.053778182715177536, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:58.316874Z", "loop": 3637, "env_steps": 2235187199, "loss": 0.001798922778107226, "avg_return": 0.45192593336105347, "regret": 0.3522098660469055, "entropy": 0.05308711156249046, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:36:59.478356Z", "loop": 3638, "env_steps": 2235801599, "loss": 0.001800946774892509, "avg_return": 0.45701807737350464, "regret": 0.3522098660469055, "entropy": 0.05223647877573967, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:00.638467Z", "loop": 3639, "env_steps": 2236415999, "loss": 0.0017250304808840156, "avg_return": 0.4584657847881317, "regret": 0.3522098660469055, "entropy": 0.052906762808561325, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:01.845560Z", "loop": 3640, "env_steps": 2237030399, "loss": 0.0015568160451948643, "avg_return": 0.4525187313556671, "regret": 0.35077103972435, "entropy": 0.0525018572807312, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:03.005575Z", "loop": 3641, "env_steps": 2237644799, "loss": 0.0015741343377158046, "avg_return": 0.4526418149471283, "regret": 0.35077103972435, "entropy": 0.052495937794446945, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:04.167099Z", "loop": 3642, "env_steps": 2238259199, "loss": 0.0015272466698661447, "avg_return": 0.4437175691127777, "regret": 0.35077103972435, "entropy": 0.05042250081896782, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:05.327533Z", "loop": 3643, "env_steps": 2238873599, "loss": 0.0015728975413367152, "avg_return": 0.45361456274986267, "regret": 0.35077103972435, "entropy": 0.05169688165187836, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:06.488728Z", "loop": 3644, "env_steps": 2239487999, "loss": 0.0017785938689485192, "avg_return": 0.45253729820251465, "regret": 0.35077103972435, "entropy": 0.05319860205054283, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:07.650743Z", "loop": 3645, "env_steps": 2240102399, "loss": 0.0015235026367008686, "avg_return": 0.450126975774765, "regret": 0.35077103972435, "entropy": 0.04986052215099335, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:08.811961Z", "loop": 3646, "env_steps": 2240716799, "loss": 0.0014664147747680545, "avg_return": 0.4578234851360321, "regret": 0.35077103972435, "entropy": 0.04585723206400871, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:09.974587Z", "loop": 3647, "env_steps": 2241331199, "loss": 0.001699697459116578, "avg_return": 0.45684149861335754, "regret": 0.35077103972435, "entropy": 0.04796713963150978, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:11.135199Z", "loop": 3648, "env_steps": 2241945599, "loss": 0.0014451518654823303, "avg_return": 0.4556548297405243, "regret": 0.35077103972435, "entropy": 0.04637469723820686, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:12.296452Z", "loop": 3649, "env_steps": 2242559999, "loss": 0.0014002051902934909, "avg_return": 0.454006552696228, "regret": 0.35077103972435, "entropy": 0.05091478303074837, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:13.503692Z", "loop": 3650, "env_steps": 2243174399, "loss": 0.0014432313619181514, "avg_return": 0.45458272099494934, "regret": 0.3507380783557892, "entropy": 0.051330022513866425, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:14.664355Z", "loop": 3651, "env_steps": 2243788799, "loss": 0.0014643041649833322, "avg_return": 0.4548885226249695, "regret": 0.3507380783557892, "entropy": 0.04871971160173416, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:15.824703Z", "loop": 3652, "env_steps": 2244403199, "loss": 0.001446282141841948, "avg_return": 0.4477292001247406, "regret": 0.3507380783557892, "entropy": 0.048424191772937775, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:16.985354Z", "loop": 3653, "env_steps": 2245017599, "loss": 0.0010775065748021007, "avg_return": 0.4485433101654053, "regret": 0.3507380783557892, "entropy": 0.04790324345231056, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:18.146983Z", "loop": 3654, "env_steps": 2245631999, "loss": 0.0011028191074728966, "avg_return": 0.45076391100883484, "regret": 0.3507380783557892, "entropy": 0.04061467573046684, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:19.308422Z", "loop": 3655, "env_steps": 2246246399, "loss": 0.0008525088778696954, "avg_return": 0.4595149755477905, "regret": 0.3507380783557892, "entropy": 0.03728700801730156, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:20.470134Z", "loop": 3656, "env_steps": 2246860799, "loss": 0.0009986328659579158, "avg_return": 0.4573442041873932, "regret": 0.3507380783557892, "entropy": 0.03930123150348663, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:21.629979Z", "loop": 3657, "env_steps": 2247475199, "loss": 0.0008029804448597133, "avg_return": 0.4537700414657593, "regret": 0.3507380783557892, "entropy": 0.038188543170690536, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:22.791509Z", "loop": 3658, "env_steps": 2248089599, "loss": 0.0008991832146421075, "avg_return": 0.4517090916633606, "regret": 0.3507380783557892, "entropy": 0.036347661167383194, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:23.953131Z", "loop": 3659, "env_steps": 2248703999, "loss": 0.0010136793134734035, "avg_return": 0.45295900106430054, "regret": 0.3507380783557892, "entropy": 0.03868513181805611, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:25.158414Z", "loop": 3660, "env_steps": 2249318399, "loss": 0.0010406083893030882, "avg_return": 0.46166902780532837, "regret": 0.35068798065185547, "entropy": 0.04306145757436752, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:26.319672Z", "loop": 3661, "env_steps": 2249932799, "loss": 0.0012564602075144649, "avg_return": 0.4560711681842804, "regret": 0.35068798065185547, "entropy": 0.04100481793284416, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:27.480422Z", "loop": 3662, "env_steps": 2250547199, "loss": 0.001408010139130056, "avg_return": 0.4503358006477356, "regret": 0.35068798065185547, "entropy": 0.04504495859146118, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:28.641580Z", "loop": 3663, "env_steps": 2251161599, "loss": 0.0014995514648035169, "avg_return": 0.4512706995010376, "regret": 0.35068798065185547, "entropy": 0.04932725057005882, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:29.802394Z", "loop": 3664, "env_steps": 2251775999, "loss": 0.00156692904420197, "avg_return": 0.455043762922287, "regret": 0.35068798065185547, "entropy": 0.053525760769844055, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:30.964038Z", "loop": 3665, "env_steps": 2252390399, "loss": 0.001443974208086729, "avg_return": 0.4550861716270447, "regret": 0.35068798065185547, "entropy": 0.048846129328012466, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:32.123884Z", "loop": 3666, "env_steps": 2253004799, "loss": 0.0018483087187632918, "avg_return": 0.4445584714412689, "regret": 0.35068798065185547, "entropy": 0.05615927651524544, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:33.285081Z", "loop": 3667, "env_steps": 2253619199, "loss": 0.0021496571134775877, "avg_return": 0.4513792097568512, "regret": 0.35068798065185547, "entropy": 0.053814973682165146, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:34.446523Z", "loop": 3668, "env_steps": 2254233599, "loss": 0.002106184372678399, "avg_return": 0.4483436644077301, "regret": 0.35068798065185547, "entropy": 0.0554409921169281, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:35.607164Z", "loop": 3669, "env_steps": 2254847999, "loss": 0.0020769955590367317, "avg_return": 0.4545472264289856, "regret": 0.35068798065185547, "entropy": 0.0535733737051487, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:36.813099Z", "loop": 3670, "env_steps": 2255462399, "loss": 0.0020932808984071016, "avg_return": 0.45530885457992554, "regret": 0.3516445755958557, "entropy": 0.05571550875902176, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:37.974413Z", "loop": 3671, "env_steps": 2256076799, "loss": 0.0020497238729149103, "avg_return": 0.45815709233283997, "regret": 0.3516445755958557, "entropy": 0.0554598830640316, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:39.136249Z", "loop": 3672, "env_steps": 2256691199, "loss": 0.0019116665935143828, "avg_return": 0.4535336494445801, "regret": 0.3516445755958557, "entropy": 0.05173889920115471, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:40.296734Z", "loop": 3673, "env_steps": 2257305599, "loss": 0.0018837640527635813, "avg_return": 0.44822317361831665, "regret": 0.3516445755958557, "entropy": 0.05544993653893471, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:41.458094Z", "loop": 3674, "env_steps": 2257919999, "loss": 0.0017599547281861305, "avg_return": 0.4549504816532135, "regret": 0.3516445755958557, "entropy": 0.05387510731816292, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:42.618061Z", "loop": 3675, "env_steps": 2258534399, "loss": 0.0019324299646541476, "avg_return": 0.45538830757141113, "regret": 0.3516445755958557, "entropy": 0.053825441747903824, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:43.779952Z", "loop": 3676, "env_steps": 2259148799, "loss": 0.001799442688934505, "avg_return": 0.45262274146080017, "regret": 0.3516445755958557, "entropy": 0.05471835285425186, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:44.941753Z", "loop": 3677, "env_steps": 2259763199, "loss": 0.001521838828921318, "avg_return": 0.45638296008110046, "regret": 0.3516445755958557, "entropy": 0.04524361714720726, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:46.102276Z", "loop": 3678, "env_steps": 2260377599, "loss": 0.0016388181829825044, "avg_return": 0.44830963015556335, "regret": 0.3516445755958557, "entropy": 0.04876872897148132, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:47.263670Z", "loop": 3679, "env_steps": 2260991999, "loss": 0.0016101303044706583, "avg_return": 0.4583093225955963, "regret": 0.3516445755958557, "entropy": 0.047862906008958817, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:48.467186Z", "loop": 3680, "env_steps": 2261606399, "loss": 0.0016422290354967117, "avg_return": 0.4523313045501709, "regret": 0.3510545790195465, "entropy": 0.046719297766685486, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:49.628954Z", "loop": 3681, "env_steps": 2262220799, "loss": 0.0017281260807067156, "avg_return": 0.46098196506500244, "regret": 0.3510545790195465, "entropy": 0.049171801656484604, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:50.790123Z", "loop": 3682, "env_steps": 2262835199, "loss": 0.001797617762349546, "avg_return": 0.45998677611351013, "regret": 0.3510545790195465, "entropy": 0.04925829917192459, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:51.952339Z", "loop": 3683, "env_steps": 2263449599, "loss": 0.0016126184491440654, "avg_return": 0.45374584197998047, "regret": 0.3510545790195465, "entropy": 0.04716329276561737, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:53.112595Z", "loop": 3684, "env_steps": 2264063999, "loss": 0.0018764134729281068, "avg_return": 0.45446962118148804, "regret": 0.3510545790195465, "entropy": 0.04933273419737816, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:54.274084Z", "loop": 3685, "env_steps": 2264678399, "loss": 0.001670142519287765, "avg_return": 0.4523754417896271, "regret": 0.3510545790195465, "entropy": 0.046242181211709976, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:55.434866Z", "loop": 3686, "env_steps": 2265292799, "loss": 0.0016253015492111444, "avg_return": 0.4503052234649658, "regret": 0.3510545790195465, "entropy": 0.04697065427899361, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:56.595571Z", "loop": 3687, "env_steps": 2265907199, "loss": 0.0017957832897081971, "avg_return": 0.45467254519462585, "regret": 0.3510545790195465, "entropy": 0.048738062381744385, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:57.757256Z", "loop": 3688, "env_steps": 2266521599, "loss": 0.0017395602772012353, "avg_return": 0.455061137676239, "regret": 0.3510545790195465, "entropy": 0.045135509222745895, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:37:58.918071Z", "loop": 3689, "env_steps": 2267135999, "loss": 0.001426316681317985, "avg_return": 0.44942402839660645, "regret": 0.3510545790195465, "entropy": 0.04292522370815277, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:00.124968Z", "loop": 3690, "env_steps": 2267750399, "loss": 0.001783400191925466, "avg_return": 0.44616129994392395, "regret": 0.3534194529056549, "entropy": 0.050648219883441925, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:01.286274Z", "loop": 3691, "env_steps": 2268364799, "loss": 0.0019425895297899842, "avg_return": 0.44720694422721863, "regret": 0.3534194529056549, "entropy": 0.04946569725871086, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:02.448151Z", "loop": 3692, "env_steps": 2268979199, "loss": 0.0016182813560590148, "avg_return": 0.4470234811306, "regret": 0.3534194529056549, "entropy": 0.045736003667116165, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:03.609031Z", "loop": 3693, "env_steps": 2269593599, "loss": 0.0018832553178071976, "avg_return": 0.4518667161464691, "regret": 0.3534194529056549, "entropy": 0.04610607400536537, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:04.770556Z", "loop": 3694, "env_steps": 2270207999, "loss": 0.002109837718307972, "avg_return": 0.45190343260765076, "regret": 0.3534194529056549, "entropy": 0.05041048675775528, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:05.937543Z", "loop": 3695, "env_steps": 2270822399, "loss": 0.002140077529475093, "avg_return": 0.45297425985336304, "regret": 0.3534194529056549, "entropy": 0.05508752167224884, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:07.098501Z", "loop": 3696, "env_steps": 2271436799, "loss": 0.002053373260423541, "avg_return": 0.44429531693458557, "regret": 0.3534194529056549, "entropy": 0.055561769753694534, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:08.260247Z", "loop": 3697, "env_steps": 2272051199, "loss": 0.001848941552452743, "avg_return": 0.44466471672058105, "regret": 0.3534194529056549, "entropy": 0.05065460503101349, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:09.420225Z", "loop": 3698, "env_steps": 2272665599, "loss": 0.0017171017825603485, "avg_return": 0.44683966040611267, "regret": 0.3534194529056549, "entropy": 0.052498288452625275, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:10.581491Z", "loop": 3699, "env_steps": 2273279999, "loss": 0.0014609459321945906, "avg_return": 0.43710029125213623, "regret": 0.3534194529056549, "entropy": 0.050623610615730286, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:11.786037Z", "loop": 3700, "env_steps": 2273894399, "loss": 0.00163325946778059, "avg_return": 0.4507102072238922, "regret": 0.355619341135025, "entropy": 0.0515143983066082, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:12.947688Z", "loop": 3701, "env_steps": 2274508799, "loss": 0.0019062863430008292, "avg_return": 0.44980114698410034, "regret": 0.355619341135025, "entropy": 0.05040176585316658, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:14.107814Z", "loop": 3702, "env_steps": 2275123199, "loss": 0.001883014920167625, "avg_return": 0.44811901450157166, "regret": 0.355619341135025, "entropy": 0.054811663925647736, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:15.269099Z", "loop": 3703, "env_steps": 2275737599, "loss": 0.001715368591248989, "avg_return": 0.4414794445037842, "regret": 0.355619341135025, "entropy": 0.05278000608086586, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:16.430715Z", "loop": 3704, "env_steps": 2276351999, "loss": 0.002145567210391164, "avg_return": 0.44877931475639343, "regret": 0.355619341135025, "entropy": 0.057855647057294846, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:17.592027Z", "loop": 3705, "env_steps": 2276966399, "loss": 0.0021099476143717766, "avg_return": 0.4514436423778534, "regret": 0.355619341135025, "entropy": 0.05655091255903244, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:18.753473Z", "loop": 3706, "env_steps": 2277580799, "loss": 0.0022023660130798817, "avg_return": 0.4545573592185974, "regret": 0.355619341135025, "entropy": 0.05712691321969032, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:19.913482Z", "loop": 3707, "env_steps": 2278195199, "loss": 0.002001616870984435, "avg_return": 0.4571641683578491, "regret": 0.355619341135025, "entropy": 0.05131244659423828, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:21.074415Z", "loop": 3708, "env_steps": 2278809599, "loss": 0.0017229665536433458, "avg_return": 0.4560021460056305, "regret": 0.355619341135025, "entropy": 0.053053051233291626, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:22.233887Z", "loop": 3709, "env_steps": 2279423999, "loss": 0.0016936067258939147, "avg_return": 0.45616206526756287, "regret": 0.355619341135025, "entropy": 0.05260327085852623, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:23.437131Z", "loop": 3710, "env_steps": 2280038399, "loss": 0.0019157242495566607, "avg_return": 0.45209819078445435, "regret": 0.3510892987251282, "entropy": 0.04806956276297569, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:24.597287Z", "loop": 3711, "env_steps": 2280652799, "loss": 0.0013202119152992964, "avg_return": 0.44821563363075256, "regret": 0.3510892987251282, "entropy": 0.04681111127138138, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:25.758435Z", "loop": 3712, "env_steps": 2281267199, "loss": 0.0015116601716727018, "avg_return": 0.4448811411857605, "regret": 0.3510892987251282, "entropy": 0.045821305364370346, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:26.918187Z", "loop": 3713, "env_steps": 2281881599, "loss": 0.0016784340841695666, "avg_return": 0.45601686835289, "regret": 0.3510892987251282, "entropy": 0.046633459627628326, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:28.079157Z", "loop": 3714, "env_steps": 2282495999, "loss": 0.0016657790401950479, "avg_return": 0.4555113911628723, "regret": 0.3510892987251282, "entropy": 0.053884074091911316, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:29.240568Z", "loop": 3715, "env_steps": 2283110399, "loss": 0.002230306388810277, "avg_return": 0.4492621421813965, "regret": 0.3510892987251282, "entropy": 0.0635308101773262, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:30.401557Z", "loop": 3716, "env_steps": 2283724799, "loss": 0.00286619714461267, "avg_return": 0.45485591888427734, "regret": 0.3510892987251282, "entropy": 0.06972362846136093, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:31.562990Z", "loop": 3717, "env_steps": 2284339199, "loss": 0.0021024083252996206, "avg_return": 0.4541052281856537, "regret": 0.3510892987251282, "entropy": 0.06354515254497528, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:32.723943Z", "loop": 3718, "env_steps": 2284953599, "loss": 0.0015697600319981575, "avg_return": 0.4535031318664551, "regret": 0.3510892987251282, "entropy": 0.06387075036764145, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:33.885264Z", "loop": 3719, "env_steps": 2285567999, "loss": 0.0008234614506363869, "avg_return": 0.4509563446044922, "regret": 0.3510892987251282, "entropy": 0.06186169385910034, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:35.097129Z", "loop": 3720, "env_steps": 2286182399, "loss": 0.0006297612562775612, "avg_return": 0.4528261423110962, "regret": 0.35095658898353577, "entropy": 0.05805784463882446, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:36.258784Z", "loop": 3721, "env_steps": 2286796799, "loss": 0.0007205662550404668, "avg_return": 0.4515901803970337, "regret": 0.35095658898353577, "entropy": 0.0548156276345253, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:37.420436Z", "loop": 3722, "env_steps": 2287411199, "loss": 0.0009914247784763575, "avg_return": 0.4517654478549957, "regret": 0.35095658898353577, "entropy": 0.0632392093539238, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:38.581609Z", "loop": 3723, "env_steps": 2288025599, "loss": 0.0014010543236508965, "avg_return": 0.4522627890110016, "regret": 0.35095658898353577, "entropy": 0.0667676329612732, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:39.742785Z", "loop": 3724, "env_steps": 2288639999, "loss": 0.001530289533548057, "avg_return": 0.4538003206253052, "regret": 0.35095658898353577, "entropy": 0.06413798034191132, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:40.903291Z", "loop": 3725, "env_steps": 2289254399, "loss": 0.001130668562836945, "avg_return": 0.45405590534210205, "regret": 0.35095658898353577, "entropy": 0.06110357120633125, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:42.064838Z", "loop": 3726, "env_steps": 2289868799, "loss": 0.000925281026866287, "avg_return": 0.45047202706336975, "regret": 0.35095658898353577, "entropy": 0.06230003386735916, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:43.226398Z", "loop": 3727, "env_steps": 2290483199, "loss": 0.0009436066611669958, "avg_return": 0.45135238766670227, "regret": 0.35095658898353577, "entropy": 0.0643603727221489, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:44.387204Z", "loop": 3728, "env_steps": 2291097599, "loss": 0.0007538620266132057, "avg_return": 0.4528019428253174, "regret": 0.35095658898353577, "entropy": 0.066002756357193, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:45.548909Z", "loop": 3729, "env_steps": 2291711999, "loss": 0.0009750351309776306, "avg_return": 0.45615866780281067, "regret": 0.35095658898353577, "entropy": 0.061386529356241226, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:46.759333Z", "loop": 3730, "env_steps": 2292326399, "loss": 0.0007423415663652122, "avg_return": 0.45178645849227905, "regret": 0.35173457860946655, "entropy": 0.0594770610332489, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:47.923392Z", "loop": 3731, "env_steps": 2292940799, "loss": 0.0006436967523768544, "avg_return": 0.4456510543823242, "regret": 0.35173457860946655, "entropy": 0.05685892328619957, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:49.085012Z", "loop": 3732, "env_steps": 2293555199, "loss": 0.0005686866934411228, "avg_return": 0.4409356713294983, "regret": 0.35173457860946655, "entropy": 0.057451166212558746, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:50.247400Z", "loop": 3733, "env_steps": 2294169599, "loss": 0.000677808653563261, "avg_return": 0.45135098695755005, "regret": 0.35173457860946655, "entropy": 0.051331158727407455, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:51.408075Z", "loop": 3734, "env_steps": 2294783999, "loss": 0.00039819820085540414, "avg_return": 0.45327484607696533, "regret": 0.35173457860946655, "entropy": 0.051698051393032074, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:52.571313Z", "loop": 3735, "env_steps": 2295398399, "loss": 0.00034097765455953777, "avg_return": 0.45383501052856445, "regret": 0.35173457860946655, "entropy": 0.048463109880685806, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:53.734029Z", "loop": 3736, "env_steps": 2296012799, "loss": 0.0005425017443485558, "avg_return": 0.45200115442276, "regret": 0.35173457860946655, "entropy": 0.05186796560883522, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:54.895159Z", "loop": 3737, "env_steps": 2296627199, "loss": 0.0005506055313162506, "avg_return": 0.45210716128349304, "regret": 0.35173457860946655, "entropy": 0.05398779734969139, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:56.057022Z", "loop": 3738, "env_steps": 2297241599, "loss": 0.0005291083944030106, "avg_return": 0.4551951289176941, "regret": 0.35173457860946655, "entropy": 0.04843733087182045, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:57.218228Z", "loop": 3739, "env_steps": 2297855999, "loss": 0.0006670957081951201, "avg_return": 0.45609161257743835, "regret": 0.35173457860946655, "entropy": 0.04882577806711197, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:58.430544Z", "loop": 3740, "env_steps": 2298470399, "loss": 0.0008414755575358868, "avg_return": 0.4463559091091156, "regret": 0.3525752127170563, "entropy": 0.05010131746530533, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:38:59.592358Z", "loop": 3741, "env_steps": 2299084799, "loss": 0.0011871273163706064, "avg_return": 0.449695348739624, "regret": 0.3525752127170563, "entropy": 0.05478713661432266, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:00.754460Z", "loop": 3742, "env_steps": 2299699199, "loss": 0.001104105613194406, "avg_return": 0.44940218329429626, "regret": 0.3525752127170563, "entropy": 0.05411592498421669, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:01.916664Z", "loop": 3743, "env_steps": 2300313599, "loss": 0.0011644624173641205, "avg_return": 0.4476935863494873, "regret": 0.3525752127170563, "entropy": 0.05239017307758331, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:03.078176Z", "loop": 3744, "env_steps": 2300927999, "loss": 0.0010603702394291759, "avg_return": 0.45245057344436646, "regret": 0.3525752127170563, "entropy": 0.05518496409058571, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:04.240657Z", "loop": 3745, "env_steps": 2301542399, "loss": 0.0007131880847737193, "avg_return": 0.45510396361351013, "regret": 0.3525752127170563, "entropy": 0.04909538850188255, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:05.401501Z", "loop": 3746, "env_steps": 2302156799, "loss": 0.0006057368009351194, "avg_return": 0.4516945481300354, "regret": 0.3525752127170563, "entropy": 0.049447912722826004, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:06.563430Z", "loop": 3747, "env_steps": 2302771199, "loss": 0.0004385020292829722, "avg_return": 0.45026206970214844, "regret": 0.3525752127170563, "entropy": 0.05113665759563446, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:07.726042Z", "loop": 3748, "env_steps": 2303385599, "loss": 0.00047088065184652805, "avg_return": 0.45429566502571106, "regret": 0.3525752127170563, "entropy": 0.05165481939911842, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:08.887388Z", "loop": 3749, "env_steps": 2303999999, "loss": 0.000546395720448345, "avg_return": 0.45461875200271606, "regret": 0.3525752127170563, "entropy": 0.0542023703455925, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:10.094279Z", "loop": 3750, "env_steps": 2304614399, "loss": 0.000525532232131809, "avg_return": 0.4480810761451721, "regret": 0.3509516417980194, "entropy": 0.05522080510854721, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:11.255426Z", "loop": 3751, "env_steps": 2305228799, "loss": 0.0006422551232390106, "avg_return": 0.45609405636787415, "regret": 0.3509516417980194, "entropy": 0.05364019423723221, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:12.417464Z", "loop": 3752, "env_steps": 2305843199, "loss": 0.0006921768072061241, "avg_return": 0.44913655519485474, "regret": 0.3509516417980194, "entropy": 0.0614502876996994, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:13.577753Z", "loop": 3753, "env_steps": 2306457599, "loss": 0.0008515215595252812, "avg_return": 0.4503963887691498, "regret": 0.3509516417980194, "entropy": 0.06187242269515991, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:14.739597Z", "loop": 3754, "env_steps": 2307071999, "loss": 0.0007265066378749907, "avg_return": 0.4574946165084839, "regret": 0.3509516417980194, "entropy": 0.05954110622406006, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:15.900448Z", "loop": 3755, "env_steps": 2307686399, "loss": 0.0006983847124502063, "avg_return": 0.44680675864219666, "regret": 0.3509516417980194, "entropy": 0.05848906189203262, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:17.062561Z", "loop": 3756, "env_steps": 2308300799, "loss": 0.0008263601339422166, "avg_return": 0.45279979705810547, "regret": 0.3509516417980194, "entropy": 0.05786997452378273, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:18.224055Z", "loop": 3757, "env_steps": 2308915199, "loss": 0.0007925500976853073, "avg_return": 0.45307302474975586, "regret": 0.3509516417980194, "entropy": 0.061888642609119415, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:19.386156Z", "loop": 3758, "env_steps": 2309529599, "loss": 0.0007455278537236154, "avg_return": 0.4518686532974243, "regret": 0.3509516417980194, "entropy": 0.06440304219722748, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:20.548093Z", "loop": 3759, "env_steps": 2310143999, "loss": 0.0008610633085481822, "avg_return": 0.44917964935302734, "regret": 0.3509516417980194, "entropy": 0.06697805970907211, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:21.753012Z", "loop": 3760, "env_steps": 2310758399, "loss": 0.0008694942225702107, "avg_return": 0.44776323437690735, "regret": 0.3506505489349365, "entropy": 0.0625016987323761, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:22.917243Z", "loop": 3761, "env_steps": 2311372799, "loss": 0.000999337644316256, "avg_return": 0.4539968967437744, "regret": 0.3506505489349365, "entropy": 0.0666050836443901, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:24.080079Z", "loop": 3762, "env_steps": 2311987199, "loss": 0.0009045004844665527, "avg_return": 0.45517227053642273, "regret": 0.3506505489349365, "entropy": 0.07046274095773697, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:25.245145Z", "loop": 3763, "env_steps": 2312601599, "loss": 0.0010224796133115888, "avg_return": 0.4532252252101898, "regret": 0.3506505489349365, "entropy": 0.060961801558732986, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:26.407862Z", "loop": 3764, "env_steps": 2313215999, "loss": 0.001037629204802215, "avg_return": 0.4518876373767853, "regret": 0.3506505489349365, "entropy": 0.06421014666557312, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:27.567809Z", "loop": 3765, "env_steps": 2313830399, "loss": 0.0011467159492895007, "avg_return": 0.45139262080192566, "regret": 0.3506505489349365, "entropy": 0.06281081587076187, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:28.729669Z", "loop": 3766, "env_steps": 2314444799, "loss": 0.0010566571727395058, "avg_return": 0.4524388611316681, "regret": 0.3506505489349365, "entropy": 0.06685229390859604, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:29.890204Z", "loop": 3767, "env_steps": 2315059199, "loss": 0.0011974532390013337, "avg_return": 0.44858404994010925, "regret": 0.3506505489349365, "entropy": 0.06941531598567963, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} +{"ts": "2026-01-29T22:39:31.050732Z", "loop": 3768, "env_steps": 2315673599, "loss": 0.0012299276422709227, "avg_return": 0.44822484254837036, "regret": 0.3506505489349365, "entropy": 0.06963272392749786, "lr": 5e-05, "discount_rate": 0.97, "num_rollout_steps": 64} diff --git a/al_0.6_g_0.97_id_11_seed_970611/train.log b/al_0.6_g_0.97_id_11_seed_970611/train.log new file mode 100644 index 0000000000000000000000000000000000000000..15566ccbf1ffb15ca64f5b6278a01b2371d68202 --- /dev/null +++ b/al_0.6_g_0.97_id_11_seed_970611/train.log @@ -0,0 +1,3769 @@ +[2026-01-29T21:25:57.840988Z] Loop 0: Loss: 1.41e-02, Avg Return: 0.087, Regret: 0.7080, Entropy: 1.3863 +[2026-01-29T21:25:59.054150Z] Loop 1: Loss: 1.42e-02, Avg Return: 0.085, Regret: 0.7076, Entropy: 1.3863 +[2026-01-29T21:26:00.265894Z] Loop 2: Loss: 1.34e-02, Avg Return: 0.085, Regret: 0.7073, Entropy: 1.3863 +[2026-01-29T21:26:01.473350Z] Loop 3: Loss: 1.44e-02, Avg Return: 0.094, Regret: 0.7070, Entropy: 1.3863 +[2026-01-29T21:26:02.676328Z] Loop 4: Loss: 1.41e-02, Avg Return: 0.089, Regret: 0.7067, Entropy: 1.3863 +[2026-01-29T21:26:03.880329Z] Loop 5: Loss: 1.41e-02, Avg Return: 0.091, Regret: 0.7064, Entropy: 1.3863 +[2026-01-29T21:26:05.094812Z] Loop 6: Loss: 1.48e-02, Avg Return: 0.089, Regret: 0.7061, Entropy: 1.3863 +[2026-01-29T21:26:06.310786Z] Loop 7: Loss: 1.39e-02, Avg Return: 0.090, Regret: 0.7058, Entropy: 1.3863 +[2026-01-29T21:26:07.521493Z] Loop 8: Loss: 1.57e-02, Avg Return: 0.089, Regret: 0.7055, Entropy: 1.3862 +[2026-01-29T21:26:08.724719Z] Loop 9: Loss: 1.65e-02, Avg Return: 0.093, Regret: 0.7052, Entropy: 1.3862 +[2026-01-29T21:26:09.929209Z] Loop 10: Loss: 1.68e-02, Avg Return: 0.094, Regret: 0.7049, Entropy: 1.3862 +[2026-01-29T21:26:11.131732Z] Loop 11: Loss: 1.51e-02, Avg Return: 0.091, Regret: 0.7046, Entropy: 1.3862 +[2026-01-29T21:26:12.339013Z] Loop 12: Loss: 1.40e-02, Avg Return: 0.089, Regret: 0.7043, Entropy: 1.3862 +[2026-01-29T21:26:13.548955Z] Loop 13: Loss: 1.44e-02, Avg Return: 0.093, Regret: 0.7040, Entropy: 1.3861 +[2026-01-29T21:26:14.757499Z] Loop 14: Loss: 1.62e-02, Avg Return: 0.093, Regret: 0.7036, Entropy: 1.3861 +[2026-01-29T21:26:15.962940Z] Loop 15: Loss: 1.51e-02, Avg Return: 0.092, Regret: 0.7032, Entropy: 1.3861 +[2026-01-29T21:26:17.165342Z] Loop 16: Loss: 1.41e-02, Avg Return: 0.090, Regret: 0.7029, Entropy: 1.3860 +[2026-01-29T21:26:18.373136Z] Loop 17: Loss: 1.60e-02, Avg Return: 0.094, Regret: 0.7025, Entropy: 1.3860 +[2026-01-29T21:26:19.578404Z] Loop 18: Loss: 1.51e-02, Avg Return: 0.091, Regret: 0.7021, Entropy: 1.3859 +[2026-01-29T21:26:20.783615Z] Loop 19: Loss: 1.54e-02, Avg Return: 0.089, Regret: 0.7016, Entropy: 1.3859 +[2026-01-29T21:26:21.993224Z] Loop 20: Loss: 1.50e-02, Avg Return: 0.093, Regret: 0.7012, Entropy: 1.3858 +[2026-01-29T21:26:23.202091Z] Loop 21: Loss: 1.47e-02, Avg Return: 0.088, Regret: 0.7007, Entropy: 1.3857 +[2026-01-29T21:26:24.409810Z] Loop 22: Loss: 1.49e-02, Avg Return: 0.097, Regret: 0.7002, Entropy: 1.3857 +[2026-01-29T21:26:25.612713Z] Loop 23: Loss: 1.58e-02, Avg Return: 0.092, Regret: 0.6997, Entropy: 1.3856 +[2026-01-29T21:26:26.815895Z] Loop 24: Loss: 1.44e-02, Avg Return: 0.093, Regret: 0.6992, Entropy: 1.3855 +[2026-01-29T21:26:28.017873Z] Loop 25: Loss: 1.61e-02, Avg Return: 0.098, Regret: 0.6986, Entropy: 1.3854 +[2026-01-29T21:26:29.217839Z] Loop 26: Loss: 1.60e-02, Avg Return: 0.098, Regret: 0.6980, Entropy: 1.3852 +[2026-01-29T21:26:30.427831Z] Loop 27: Loss: 1.61e-02, Avg Return: 0.098, Regret: 0.6973, Entropy: 1.3851 +[2026-01-29T21:26:31.630408Z] Loop 28: Loss: 1.72e-02, Avg Return: 0.092, Regret: 0.6966, Entropy: 1.3849 +[2026-01-29T21:26:32.832097Z] Loop 29: Loss: 1.69e-02, Avg Return: 0.097, Regret: 0.6959, Entropy: 1.3848 +[2026-01-29T21:26:34.038186Z] Loop 30: Loss: 1.84e-02, Avg Return: 0.096, Regret: 0.6951, Entropy: 1.3846 +[2026-01-29T21:26:35.242256Z] Loop 31: Loss: 1.74e-02, Avg Return: 0.097, Regret: 0.6942, Entropy: 1.3844 +[2026-01-29T21:26:36.447404Z] Loop 32: Loss: 1.63e-02, Avg Return: 0.099, Regret: 0.6933, Entropy: 1.3841 +[2026-01-29T21:26:37.651271Z] Loop 33: Loss: 1.81e-02, Avg Return: 0.097, Regret: 0.6923, Entropy: 1.3838 +[2026-01-29T21:26:38.853158Z] Loop 34: Loss: 1.72e-02, Avg Return: 0.101, Regret: 0.6912, Entropy: 1.3835 +[2026-01-29T21:26:40.056461Z] Loop 35: Loss: 1.66e-02, Avg Return: 0.103, Regret: 0.6901, Entropy: 1.3832 +[2026-01-29T21:26:41.261046Z] Loop 36: Loss: 1.94e-02, Avg Return: 0.104, Regret: 0.6889, Entropy: 1.3828 +[2026-01-29T21:26:42.467552Z] Loop 37: Loss: 1.99e-02, Avg Return: 0.102, Regret: 0.6876, Entropy: 1.3824 +[2026-01-29T21:26:43.670186Z] Loop 38: Loss: 1.71e-02, Avg Return: 0.104, Regret: 0.6863, Entropy: 1.3819 +[2026-01-29T21:26:44.872976Z] Loop 39: Loss: 2.11e-02, Avg Return: 0.108, Regret: 0.6848, Entropy: 1.3814 +[2026-01-29T21:26:46.074852Z] Loop 40: Loss: 1.99e-02, Avg Return: 0.110, Regret: 0.6831, Entropy: 1.3808 +[2026-01-29T21:26:47.277221Z] Loop 41: Loss: 1.89e-02, Avg Return: 0.106, Regret: 0.6814, Entropy: 1.3801 +[2026-01-29T21:26:48.479121Z] Loop 42: Loss: 2.12e-02, Avg Return: 0.111, Regret: 0.6795, Entropy: 1.3793 +[2026-01-29T21:26:49.681508Z] Loop 43: Loss: 2.12e-02, Avg Return: 0.112, Regret: 0.6773, Entropy: 1.3784 +[2026-01-29T21:26:50.883412Z] Loop 44: Loss: 2.22e-02, Avg Return: 0.119, Regret: 0.6750, Entropy: 1.3773 +[2026-01-29T21:26:52.086313Z] Loop 45: Loss: 2.32e-02, Avg Return: 0.119, Regret: 0.6725, Entropy: 1.3761 +[2026-01-29T21:26:53.288310Z] Loop 46: Loss: 2.21e-02, Avg Return: 0.122, Regret: 0.6697, Entropy: 1.3748 +[2026-01-29T21:26:54.490079Z] Loop 47: Loss: 2.28e-02, Avg Return: 0.123, Regret: 0.6667, Entropy: 1.3732 +[2026-01-29T21:26:55.694363Z] Loop 48: Loss: 2.49e-02, Avg Return: 0.127, Regret: 0.6634, Entropy: 1.3715 +[2026-01-29T21:26:56.898257Z] Loop 49: Loss: 2.51e-02, Avg Return: 0.131, Regret: 0.6598, Entropy: 1.3694 +[2026-01-29T21:26:58.103325Z] Loop 50: Loss: 2.64e-02, Avg Return: 0.135, Regret: 0.6559, Entropy: 1.3670 +[2026-01-29T21:26:59.306270Z] Loop 51: Loss: 2.81e-02, Avg Return: 0.138, Regret: 0.6516, Entropy: 1.3643 +[2026-01-29T21:27:00.507528Z] Loop 52: Loss: 2.76e-02, Avg Return: 0.140, Regret: 0.6469, Entropy: 1.3611 +[2026-01-29T21:27:01.708423Z] Loop 53: Loss: 2.91e-02, Avg Return: 0.142, Regret: 0.6418, Entropy: 1.3574 +[2026-01-29T21:27:02.914261Z] Loop 54: Loss: 3.17e-02, Avg Return: 0.151, Regret: 0.6363, Entropy: 1.3530 +[2026-01-29T21:27:04.117935Z] Loop 55: Loss: 3.39e-02, Avg Return: 0.162, Regret: 0.6305, Entropy: 1.3481 +[2026-01-29T21:27:05.320335Z] Loop 56: Loss: 3.46e-02, Avg Return: 0.167, Regret: 0.6242, Entropy: 1.3423 +[2026-01-29T21:27:06.521962Z] Loop 57: Loss: 3.55e-02, Avg Return: 0.175, Regret: 0.6176, Entropy: 1.3356 +[2026-01-29T21:27:07.725152Z] Loop 58: Loss: 4.05e-02, Avg Return: 0.185, Regret: 0.6107, Entropy: 1.3279 +[2026-01-29T21:27:08.930186Z] Loop 59: Loss: 4.00e-02, Avg Return: 0.189, Regret: 0.6035, Entropy: 1.3190 +[2026-01-29T21:27:10.132797Z] Loop 60: Loss: 4.20e-02, Avg Return: 0.196, Regret: 0.5961, Entropy: 1.3087 +[2026-01-29T21:27:11.335028Z] Loop 61: Loss: 4.30e-02, Avg Return: 0.207, Regret: 0.5886, Entropy: 1.2968 +[2026-01-29T21:27:12.538352Z] Loop 62: Loss: 4.40e-02, Avg Return: 0.215, Regret: 0.5810, Entropy: 1.2835 +[2026-01-29T21:27:13.742864Z] Loop 63: Loss: 4.09e-02, Avg Return: 0.226, Regret: 0.5735, Entropy: 1.2682 +[2026-01-29T21:27:14.945594Z] Loop 64: Loss: 4.21e-02, Avg Return: 0.232, Regret: 0.5661, Entropy: 1.2511 +[2026-01-29T21:27:16.149199Z] Loop 65: Loss: 4.31e-02, Avg Return: 0.243, Regret: 0.5589, Entropy: 1.2319 +[2026-01-29T21:27:17.353363Z] Loop 66: Loss: 4.05e-02, Avg Return: 0.247, Regret: 0.5521, Entropy: 1.2107 +[2026-01-29T21:27:18.556520Z] Loop 67: Loss: 3.97e-02, Avg Return: 0.260, Regret: 0.5456, Entropy: 1.1878 +[2026-01-29T21:27:19.759204Z] Loop 68: Loss: 3.74e-02, Avg Return: 0.264, Regret: 0.5397, Entropy: 1.1635 +[2026-01-29T21:27:20.968300Z] Loop 69: Loss: 3.52e-02, Avg Return: 0.263, Regret: 0.5342, Entropy: 1.1378 +[2026-01-29T21:27:22.171019Z] Loop 70: Loss: 3.48e-02, Avg Return: 0.278, Regret: 0.5292, Entropy: 1.1110 +[2026-01-29T21:27:23.374017Z] Loop 71: Loss: 3.20e-02, Avg Return: 0.281, Regret: 0.5246, Entropy: 1.0841 +[2026-01-29T21:27:24.578499Z] Loop 72: Loss: 3.08e-02, Avg Return: 0.279, Regret: 0.5206, Entropy: 1.0565 +[2026-01-29T21:27:25.784153Z] Loop 73: Loss: 3.06e-02, Avg Return: 0.281, Regret: 0.5170, Entropy: 1.0294 +[2026-01-29T21:27:26.987191Z] Loop 74: Loss: 3.01e-02, Avg Return: 0.291, Regret: 0.5138, Entropy: 1.0027 +[2026-01-29T21:27:28.194186Z] Loop 75: Loss: 2.65e-02, Avg Return: 0.293, Regret: 0.5110, Entropy: 0.9765 +[2026-01-29T21:27:29.397946Z] Loop 76: Loss: 2.74e-02, Avg Return: 0.300, Regret: 0.5085, Entropy: 0.9518 +[2026-01-29T21:27:30.601947Z] Loop 77: Loss: 2.35e-02, Avg Return: 0.288, Regret: 0.5063, Entropy: 0.9286 +[2026-01-29T21:27:31.805055Z] Loop 78: Loss: 2.45e-02, Avg Return: 0.298, Regret: 0.5044, Entropy: 0.9070 +[2026-01-29T21:27:33.008915Z] Loop 79: Loss: 2.34e-02, Avg Return: 0.300, Regret: 0.5027, Entropy: 0.8876 +[2026-01-29T21:27:34.213905Z] Loop 80: Loss: 2.18e-02, Avg Return: 0.299, Regret: 0.5012, Entropy: 0.8698 +[2026-01-29T21:27:35.452786Z] Loop 81: Loss: 2.13e-02, Avg Return: 0.298, Regret: 0.4999, Entropy: 0.8529 +[2026-01-29T21:27:36.659298Z] Loop 82: Loss: 2.09e-02, Avg Return: 0.306, Regret: 0.4987, Entropy: 0.8376 +[2026-01-29T21:27:37.862669Z] Loop 83: Loss: 1.93e-02, Avg Return: 0.301, Regret: 0.4978, Entropy: 0.8237 +[2026-01-29T21:27:39.068288Z] Loop 84: Loss: 2.05e-02, Avg Return: 0.307, Regret: 0.4970, Entropy: 0.8112 +[2026-01-29T21:27:40.276797Z] Loop 85: Loss: 1.95e-02, Avg Return: 0.305, Regret: 0.4964, Entropy: 0.8003 +[2026-01-29T21:27:41.479876Z] Loop 86: Loss: 1.88e-02, Avg Return: 0.311, Regret: 0.4960, Entropy: 0.7904 +[2026-01-29T21:27:42.684158Z] Loop 87: Loss: 1.91e-02, Avg Return: 0.311, Regret: 0.4957, Entropy: 0.7815 +[2026-01-29T21:27:43.886695Z] Loop 88: Loss: 1.94e-02, Avg Return: 0.316, Regret: 0.4955, Entropy: 0.7731 +[2026-01-29T21:27:45.092323Z] Loop 89: Loss: 1.82e-02, Avg Return: 0.306, Regret: 0.4954, Entropy: 0.7658 +[2026-01-29T21:27:46.296765Z] Loop 90: Loss: 1.98e-02, Avg Return: 0.308, Regret: 0.4952, Entropy: 0.7592 +[2026-01-29T21:27:47.501234Z] Loop 91: Loss: 1.82e-02, Avg Return: 0.310, Regret: 0.4950, Entropy: 0.7537 +[2026-01-29T21:27:48.709350Z] Loop 92: Loss: 1.97e-02, Avg Return: 0.312, Regret: 0.4947, Entropy: 0.7490 +[2026-01-29T21:27:49.918912Z] Loop 93: Loss: 1.90e-02, Avg Return: 0.309, Regret: 0.4944, Entropy: 0.7450 +[2026-01-29T21:27:51.124894Z] Loop 94: Loss: 1.64e-02, Avg Return: 0.307, Regret: 0.4941, Entropy: 0.7415 +[2026-01-29T21:27:52.330244Z] Loop 95: Loss: 1.70e-02, Avg Return: 0.307, Regret: 0.4939, Entropy: 0.7384 +[2026-01-29T21:27:53.534439Z] Loop 96: Loss: 1.82e-02, Avg Return: 0.306, Regret: 0.4937, Entropy: 0.7357 +[2026-01-29T21:27:54.737886Z] Loop 97: Loss: 1.79e-02, Avg Return: 0.310, Regret: 0.4937, Entropy: 0.7328 +[2026-01-29T21:27:55.942535Z] Loop 98: Loss: 1.73e-02, Avg Return: 0.309, Regret: 0.4939, Entropy: 0.7298 +[2026-01-29T21:27:57.146729Z] Loop 99: Loss: 1.77e-02, Avg Return: 0.314, Regret: 0.4941, Entropy: 0.7265 +[2026-01-29T21:27:58.350582Z] Loop 100: Loss: 1.68e-02, Avg Return: 0.313, Regret: 0.4943, Entropy: 0.7234 +[2026-01-29T21:27:59.555484Z] Loop 101: Loss: 1.81e-02, Avg Return: 0.314, Regret: 0.4943, Entropy: 0.7215 +[2026-01-29T21:28:00.761468Z] Loop 102: Loss: 1.79e-02, Avg Return: 0.313, Regret: 0.4942, Entropy: 0.7205 +[2026-01-29T21:28:01.969668Z] Loop 103: Loss: 1.80e-02, Avg Return: 0.308, Regret: 0.4940, Entropy: 0.7202 +[2026-01-29T21:28:03.176508Z] Loop 104: Loss: 1.69e-02, Avg Return: 0.313, Regret: 0.4937, Entropy: 0.7201 +[2026-01-29T21:28:04.377451Z] Loop 105: Loss: 1.72e-02, Avg Return: 0.310, Regret: 0.4935, Entropy: 0.7204 +[2026-01-29T21:28:05.581798Z] Loop 106: Loss: 1.72e-02, Avg Return: 0.313, Regret: 0.4933, Entropy: 0.7205 +[2026-01-29T21:28:06.785131Z] Loop 107: Loss: 1.92e-02, Avg Return: 0.310, Regret: 0.4933, Entropy: 0.7204 +[2026-01-29T21:28:07.996422Z] Loop 108: Loss: 1.82e-02, Avg Return: 0.310, Regret: 0.4933, Entropy: 0.7198 +[2026-01-29T21:28:09.202670Z] Loop 109: Loss: 1.68e-02, Avg Return: 0.310, Regret: 0.4934, Entropy: 0.7191 +[2026-01-29T21:28:10.404701Z] Loop 110: Loss: 1.74e-02, Avg Return: 0.311, Regret: 0.4936, Entropy: 0.7183 +[2026-01-29T21:28:11.606239Z] Loop 111: Loss: 1.73e-02, Avg Return: 0.302, Regret: 0.4937, Entropy: 0.7177 +[2026-01-29T21:28:12.808391Z] Loop 112: Loss: 1.70e-02, Avg Return: 0.309, Regret: 0.4938, Entropy: 0.7171 +[2026-01-29T21:28:14.011675Z] Loop 113: Loss: 1.75e-02, Avg Return: 0.311, Regret: 0.4939, Entropy: 0.7164 +[2026-01-29T21:28:15.214542Z] Loop 114: Loss: 1.83e-02, Avg Return: 0.313, Regret: 0.4940, Entropy: 0.7162 +[2026-01-29T21:28:16.417341Z] Loop 115: Loss: 1.75e-02, Avg Return: 0.312, Regret: 0.4939, Entropy: 0.7159 +[2026-01-29T21:28:17.618649Z] Loop 116: Loss: 1.71e-02, Avg Return: 0.309, Regret: 0.4939, Entropy: 0.7153 +[2026-01-29T21:28:18.822597Z] Loop 117: Loss: 1.75e-02, Avg Return: 0.310, Regret: 0.4937, Entropy: 0.7153 +[2026-01-29T21:28:20.025685Z] Loop 118: Loss: 1.72e-02, Avg Return: 0.311, Regret: 0.4936, Entropy: 0.7152 +[2026-01-29T21:28:21.229120Z] Loop 119: Loss: 1.70e-02, Avg Return: 0.306, Regret: 0.4934, Entropy: 0.7154 +[2026-01-29T21:28:22.430973Z] Loop 120: Loss: 1.79e-02, Avg Return: 0.309, Regret: 0.4932, Entropy: 0.7155 +[2026-01-29T21:28:23.634202Z] Loop 121: Loss: 1.67e-02, Avg Return: 0.308, Regret: 0.4931, Entropy: 0.7153 +[2026-01-29T21:28:24.835766Z] Loop 122: Loss: 1.74e-02, Avg Return: 0.303, Regret: 0.4932, Entropy: 0.7146 +[2026-01-29T21:28:26.037712Z] Loop 123: Loss: 1.82e-02, Avg Return: 0.314, Regret: 0.4934, Entropy: 0.7135 +[2026-01-29T21:28:27.238705Z] Loop 124: Loss: 1.77e-02, Avg Return: 0.309, Regret: 0.4937, Entropy: 0.7122 +[2026-01-29T21:28:28.445074Z] Loop 125: Loss: 1.69e-02, Avg Return: 0.305, Regret: 0.4940, Entropy: 0.7108 +[2026-01-29T21:28:29.648981Z] Loop 126: Loss: 1.67e-02, Avg Return: 0.304, Regret: 0.4941, Entropy: 0.7105 +[2026-01-29T21:28:30.853474Z] Loop 127: Loss: 1.75e-02, Avg Return: 0.313, Regret: 0.4941, Entropy: 0.7104 +[2026-01-29T21:28:32.056716Z] Loop 128: Loss: 1.60e-02, Avg Return: 0.311, Regret: 0.4940, Entropy: 0.7106 +[2026-01-29T21:28:33.261784Z] Loop 129: Loss: 1.74e-02, Avg Return: 0.312, Regret: 0.4937, Entropy: 0.7116 +[2026-01-29T21:28:34.465237Z] Loop 130: Loss: 1.82e-02, Avg Return: 0.313, Regret: 0.4934, Entropy: 0.7123 +[2026-01-29T21:28:35.668178Z] Loop 131: Loss: 1.64e-02, Avg Return: 0.314, Regret: 0.4932, Entropy: 0.7131 +[2026-01-29T21:28:36.871311Z] Loop 132: Loss: 1.65e-02, Avg Return: 0.312, Regret: 0.4931, Entropy: 0.7133 +[2026-01-29T21:28:38.076270Z] Loop 133: Loss: 1.67e-02, Avg Return: 0.309, Regret: 0.4931, Entropy: 0.7133 +[2026-01-29T21:28:39.280418Z] Loop 134: Loss: 1.63e-02, Avg Return: 0.309, Regret: 0.4931, Entropy: 0.7130 +[2026-01-29T21:28:40.485781Z] Loop 135: Loss: 1.64e-02, Avg Return: 0.318, Regret: 0.4932, Entropy: 0.7126 +[2026-01-29T21:28:41.690704Z] Loop 136: Loss: 1.73e-02, Avg Return: 0.308, Regret: 0.4933, Entropy: 0.7121 +[2026-01-29T21:28:42.896527Z] Loop 137: Loss: 1.67e-02, Avg Return: 0.308, Regret: 0.4934, Entropy: 0.7117 +[2026-01-29T21:28:44.102064Z] Loop 138: Loss: 1.72e-02, Avg Return: 0.314, Regret: 0.4935, Entropy: 0.7113 +[2026-01-29T21:28:45.307803Z] Loop 139: Loss: 1.61e-02, Avg Return: 0.313, Regret: 0.4936, Entropy: 0.7110 +[2026-01-29T21:28:46.512059Z] Loop 140: Loss: 1.67e-02, Avg Return: 0.312, Regret: 0.4935, Entropy: 0.7113 +[2026-01-29T21:28:47.716877Z] Loop 141: Loss: 1.72e-02, Avg Return: 0.309, Regret: 0.4933, Entropy: 0.7118 +[2026-01-29T21:28:48.922412Z] Loop 142: Loss: 1.85e-02, Avg Return: 0.314, Regret: 0.4931, Entropy: 0.7122 +[2026-01-29T21:28:50.129258Z] Loop 143: Loss: 1.70e-02, Avg Return: 0.305, Regret: 0.4930, Entropy: 0.7124 +[2026-01-29T21:28:51.336262Z] Loop 144: Loss: 1.69e-02, Avg Return: 0.314, Regret: 0.4930, Entropy: 0.7122 +[2026-01-29T21:28:52.540401Z] Loop 145: Loss: 1.57e-02, Avg Return: 0.312, Regret: 0.4931, Entropy: 0.7118 +[2026-01-29T21:28:53.753575Z] Loop 146: Loss: 1.71e-02, Avg Return: 0.315, Regret: 0.4932, Entropy: 0.7115 +[2026-01-29T21:28:54.959877Z] Loop 147: Loss: 1.74e-02, Avg Return: 0.309, Regret: 0.4932, Entropy: 0.7112 +[2026-01-29T21:28:56.162985Z] Loop 148: Loss: 1.65e-02, Avg Return: 0.313, Regret: 0.4932, Entropy: 0.7112 +[2026-01-29T21:28:57.367774Z] Loop 149: Loss: 1.61e-02, Avg Return: 0.315, Regret: 0.4931, Entropy: 0.7113 +[2026-01-29T21:28:58.575177Z] Loop 150: Loss: 1.75e-02, Avg Return: 0.319, Regret: 0.4931, Entropy: 0.7112 +[2026-01-29T21:28:59.780154Z] Loop 151: Loss: 1.70e-02, Avg Return: 0.314, Regret: 0.4931, Entropy: 0.7110 +[2026-01-29T21:29:00.983652Z] Loop 152: Loss: 1.59e-02, Avg Return: 0.309, Regret: 0.4931, Entropy: 0.7110 +[2026-01-29T21:29:02.196322Z] Loop 153: Loss: 1.76e-02, Avg Return: 0.307, Regret: 0.4931, Entropy: 0.7109 +[2026-01-29T21:29:03.396965Z] Loop 154: Loss: 1.61e-02, Avg Return: 0.302, Regret: 0.4930, Entropy: 0.7110 +[2026-01-29T21:29:04.597869Z] Loop 155: Loss: 1.66e-02, Avg Return: 0.309, Regret: 0.4930, Entropy: 0.7110 +[2026-01-29T21:29:05.797850Z] Loop 156: Loss: 1.67e-02, Avg Return: 0.306, Regret: 0.4930, Entropy: 0.7109 +[2026-01-29T21:29:06.998893Z] Loop 157: Loss: 1.55e-02, Avg Return: 0.308, Regret: 0.4930, Entropy: 0.7108 +[2026-01-29T21:29:08.200558Z] Loop 158: Loss: 1.64e-02, Avg Return: 0.308, Regret: 0.4930, Entropy: 0.7106 +[2026-01-29T21:29:09.400037Z] Loop 159: Loss: 1.73e-02, Avg Return: 0.308, Regret: 0.4930, Entropy: 0.7102 +[2026-01-29T21:29:10.599616Z] Loop 160: Loss: 1.69e-02, Avg Return: 0.306, Regret: 0.4931, Entropy: 0.7097 +[2026-01-29T21:29:11.801730Z] Loop 161: Loss: 1.79e-02, Avg Return: 0.310, Regret: 0.4933, Entropy: 0.7090 +[2026-01-29T21:29:13.004556Z] Loop 162: Loss: 1.83e-02, Avg Return: 0.310, Regret: 0.4935, Entropy: 0.7080 +[2026-01-29T21:29:14.211005Z] Loop 163: Loss: 1.72e-02, Avg Return: 0.309, Regret: 0.4937, Entropy: 0.7072 +[2026-01-29T21:29:15.415199Z] Loop 164: Loss: 1.71e-02, Avg Return: 0.310, Regret: 0.4937, Entropy: 0.7067 +[2026-01-29T21:29:16.619511Z] Loop 165: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4937, Entropy: 0.7065 +[2026-01-29T21:29:17.824733Z] Loop 166: Loss: 1.78e-02, Avg Return: 0.317, Regret: 0.4934, Entropy: 0.7072 +[2026-01-29T21:29:19.034186Z] Loop 167: Loss: 1.76e-02, Avg Return: 0.311, Regret: 0.4931, Entropy: 0.7077 +[2026-01-29T21:29:20.239530Z] Loop 168: Loss: 1.66e-02, Avg Return: 0.314, Regret: 0.4929, Entropy: 0.7080 +[2026-01-29T21:29:21.443891Z] Loop 169: Loss: 1.73e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.7077 +[2026-01-29T21:29:22.649634Z] Loop 170: Loss: 1.61e-02, Avg Return: 0.310, Regret: 0.4931, Entropy: 0.7069 +[2026-01-29T21:29:23.855078Z] Loop 171: Loss: 1.79e-02, Avg Return: 0.314, Regret: 0.4933, Entropy: 0.7061 +[2026-01-29T21:29:25.059294Z] Loop 172: Loss: 1.63e-02, Avg Return: 0.316, Regret: 0.4935, Entropy: 0.7054 +[2026-01-29T21:29:26.263199Z] Loop 173: Loss: 1.71e-02, Avg Return: 0.311, Regret: 0.4936, Entropy: 0.7049 +[2026-01-29T21:29:27.467808Z] Loop 174: Loss: 1.68e-02, Avg Return: 0.311, Regret: 0.4937, Entropy: 0.7043 +[2026-01-29T21:29:28.672067Z] Loop 175: Loss: 1.71e-02, Avg Return: 0.310, Regret: 0.4937, Entropy: 0.7041 +[2026-01-29T21:29:29.875974Z] Loop 176: Loss: 1.71e-02, Avg Return: 0.316, Regret: 0.4937, Entropy: 0.7040 +[2026-01-29T21:29:31.079613Z] Loop 177: Loss: 1.77e-02, Avg Return: 0.310, Regret: 0.4935, Entropy: 0.7045 +[2026-01-29T21:29:32.281449Z] Loop 178: Loss: 1.78e-02, Avg Return: 0.301, Regret: 0.4933, Entropy: 0.7050 +[2026-01-29T21:29:33.487344Z] Loop 179: Loss: 1.68e-02, Avg Return: 0.311, Regret: 0.4932, Entropy: 0.7056 +[2026-01-29T21:29:34.692863Z] Loop 180: Loss: 1.61e-02, Avg Return: 0.314, Regret: 0.4930, Entropy: 0.7060 +[2026-01-29T21:29:35.897406Z] Loop 181: Loss: 1.77e-02, Avg Return: 0.316, Regret: 0.4930, Entropy: 0.7063 +[2026-01-29T21:29:37.101596Z] Loop 182: Loss: 1.70e-02, Avg Return: 0.302, Regret: 0.4929, Entropy: 0.7065 +[2026-01-29T21:29:38.309093Z] Loop 183: Loss: 1.72e-02, Avg Return: 0.317, Regret: 0.4929, Entropy: 0.7064 +[2026-01-29T21:29:39.512908Z] Loop 184: Loss: 1.67e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.7061 +[2026-01-29T21:29:40.718329Z] Loop 185: Loss: 1.70e-02, Avg Return: 0.316, Regret: 0.4931, Entropy: 0.7054 +[2026-01-29T21:29:41.922901Z] Loop 186: Loss: 1.65e-02, Avg Return: 0.314, Regret: 0.4933, Entropy: 0.7046 +[2026-01-29T21:29:43.127322Z] Loop 187: Loss: 1.72e-02, Avg Return: 0.311, Regret: 0.4933, Entropy: 0.7042 +[2026-01-29T21:29:44.331556Z] Loop 188: Loss: 1.61e-02, Avg Return: 0.303, Regret: 0.4933, Entropy: 0.7042 +[2026-01-29T21:29:45.536912Z] Loop 189: Loss: 1.71e-02, Avg Return: 0.308, Regret: 0.4932, Entropy: 0.7043 +[2026-01-29T21:29:46.740874Z] Loop 190: Loss: 1.73e-02, Avg Return: 0.313, Regret: 0.4931, Entropy: 0.7047 +[2026-01-29T21:29:47.945962Z] Loop 191: Loss: 1.58e-02, Avg Return: 0.310, Regret: 0.4931, Entropy: 0.7047 +[2026-01-29T21:29:49.149790Z] Loop 192: Loss: 1.60e-02, Avg Return: 0.309, Regret: 0.4929, Entropy: 0.7051 +[2026-01-29T21:29:50.362720Z] Loop 193: Loss: 1.74e-02, Avg Return: 0.313, Regret: 0.4928, Entropy: 0.7052 +[2026-01-29T21:29:51.566985Z] Loop 194: Loss: 1.76e-02, Avg Return: 0.313, Regret: 0.4929, Entropy: 0.7048 +[2026-01-29T21:29:52.772260Z] Loop 195: Loss: 1.80e-02, Avg Return: 0.314, Regret: 0.4931, Entropy: 0.7038 +[2026-01-29T21:29:53.975466Z] Loop 196: Loss: 1.76e-02, Avg Return: 0.313, Regret: 0.4932, Entropy: 0.7032 +[2026-01-29T21:29:55.179459Z] Loop 197: Loss: 1.66e-02, Avg Return: 0.314, Regret: 0.4932, Entropy: 0.7030 +[2026-01-29T21:29:56.384978Z] Loop 198: Loss: 1.64e-02, Avg Return: 0.307, Regret: 0.4932, Entropy: 0.7033 +[2026-01-29T21:29:57.590658Z] Loop 199: Loss: 1.66e-02, Avg Return: 0.301, Regret: 0.4931, Entropy: 0.7037 +[2026-01-29T21:29:58.793726Z] Loop 200: Loss: 1.67e-02, Avg Return: 0.307, Regret: 0.4929, Entropy: 0.7041 +[2026-01-29T21:29:59.996631Z] Loop 201: Loss: 1.78e-02, Avg Return: 0.307, Regret: 0.4929, Entropy: 0.7044 +[2026-01-29T21:30:01.200249Z] Loop 202: Loss: 1.68e-02, Avg Return: 0.315, Regret: 0.4928, Entropy: 0.7046 +[2026-01-29T21:30:02.403782Z] Loop 203: Loss: 1.59e-02, Avg Return: 0.308, Regret: 0.4928, Entropy: 0.7047 +[2026-01-29T21:30:03.606320Z] Loop 204: Loss: 1.74e-02, Avg Return: 0.318, Regret: 0.4929, Entropy: 0.7045 +[2026-01-29T21:30:04.810295Z] Loop 205: Loss: 1.90e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.7043 +[2026-01-29T21:30:06.014226Z] Loop 206: Loss: 1.55e-02, Avg Return: 0.310, Regret: 0.4930, Entropy: 0.7040 +[2026-01-29T21:30:07.217930Z] Loop 207: Loss: 1.73e-02, Avg Return: 0.313, Regret: 0.4930, Entropy: 0.7037 +[2026-01-29T21:30:08.421311Z] Loop 208: Loss: 1.65e-02, Avg Return: 0.312, Regret: 0.4930, Entropy: 0.7037 +[2026-01-29T21:30:09.626374Z] Loop 209: Loss: 1.77e-02, Avg Return: 0.314, Regret: 0.4929, Entropy: 0.7039 +[2026-01-29T21:30:10.828200Z] Loop 210: Loss: 1.72e-02, Avg Return: 0.310, Regret: 0.4929, Entropy: 0.7040 +[2026-01-29T21:30:12.029681Z] Loop 211: Loss: 1.66e-02, Avg Return: 0.314, Regret: 0.4929, Entropy: 0.7042 +[2026-01-29T21:30:13.237866Z] Loop 212: Loss: 1.77e-02, Avg Return: 0.317, Regret: 0.4928, Entropy: 0.7043 +[2026-01-29T21:30:14.442886Z] Loop 213: Loss: 1.77e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.7042 +[2026-01-29T21:30:15.644539Z] Loop 214: Loss: 1.58e-02, Avg Return: 0.311, Regret: 0.4928, Entropy: 0.7040 +[2026-01-29T21:30:16.847343Z] Loop 215: Loss: 1.67e-02, Avg Return: 0.316, Regret: 0.4929, Entropy: 0.7039 +[2026-01-29T21:30:18.048576Z] Loop 216: Loss: 1.62e-02, Avg Return: 0.308, Regret: 0.4929, Entropy: 0.7038 +[2026-01-29T21:30:19.248714Z] Loop 217: Loss: 1.71e-02, Avg Return: 0.306, Regret: 0.4930, Entropy: 0.7035 +[2026-01-29T21:30:20.449584Z] Loop 218: Loss: 1.63e-02, Avg Return: 0.313, Regret: 0.4930, Entropy: 0.7035 +[2026-01-29T21:30:21.651531Z] Loop 219: Loss: 1.69e-02, Avg Return: 0.315, Regret: 0.4930, Entropy: 0.7036 +[2026-01-29T21:30:22.853848Z] Loop 220: Loss: 1.56e-02, Avg Return: 0.312, Regret: 0.4929, Entropy: 0.7037 +[2026-01-29T21:30:24.055142Z] Loop 221: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4929, Entropy: 0.7040 +[2026-01-29T21:30:25.259911Z] Loop 222: Loss: 1.68e-02, Avg Return: 0.308, Regret: 0.4928, Entropy: 0.7042 +[2026-01-29T21:30:26.461053Z] Loop 223: Loss: 1.57e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.7043 +[2026-01-29T21:30:27.664252Z] Loop 224: Loss: 1.74e-02, Avg Return: 0.311, Regret: 0.4928, Entropy: 0.7043 +[2026-01-29T21:30:28.868940Z] Loop 225: Loss: 1.53e-02, Avg Return: 0.303, Regret: 0.4928, Entropy: 0.7043 +[2026-01-29T21:30:30.079314Z] Loop 226: Loss: 1.81e-02, Avg Return: 0.319, Regret: 0.4928, Entropy: 0.7043 +[2026-01-29T21:30:31.282091Z] Loop 227: Loss: 1.72e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.7043 +[2026-01-29T21:30:32.486288Z] Loop 228: Loss: 1.69e-02, Avg Return: 0.312, Regret: 0.4928, Entropy: 0.7044 +[2026-01-29T21:30:33.692489Z] Loop 229: Loss: 1.68e-02, Avg Return: 0.305, Regret: 0.4928, Entropy: 0.7045 +[2026-01-29T21:30:34.896877Z] Loop 230: Loss: 1.63e-02, Avg Return: 0.307, Regret: 0.4928, Entropy: 0.7045 +[2026-01-29T21:30:36.102009Z] Loop 231: Loss: 1.69e-02, Avg Return: 0.311, Regret: 0.4928, Entropy: 0.7045 +[2026-01-29T21:30:37.307234Z] Loop 232: Loss: 1.70e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.7045 +[2026-01-29T21:30:38.512289Z] Loop 233: Loss: 1.69e-02, Avg Return: 0.311, Regret: 0.4928, Entropy: 0.7045 +[2026-01-29T21:30:39.717361Z] Loop 234: Loss: 1.71e-02, Avg Return: 0.312, Regret: 0.4929, Entropy: 0.7045 +[2026-01-29T21:30:40.923049Z] Loop 235: Loss: 1.81e-02, Avg Return: 0.315, Regret: 0.4929, Entropy: 0.7043 +[2026-01-29T21:30:42.126509Z] Loop 236: Loss: 1.76e-02, Avg Return: 0.318, Regret: 0.4929, Entropy: 0.7042 +[2026-01-29T21:30:43.329983Z] Loop 237: Loss: 1.63e-02, Avg Return: 0.305, Regret: 0.4929, Entropy: 0.7039 +[2026-01-29T21:30:44.540781Z] Loop 238: Loss: 1.65e-02, Avg Return: 0.307, Regret: 0.4929, Entropy: 0.7037 +[2026-01-29T21:30:45.748378Z] Loop 239: Loss: 1.65e-02, Avg Return: 0.309, Regret: 0.4930, Entropy: 0.7034 +[2026-01-29T21:30:46.953941Z] Loop 240: Loss: 1.64e-02, Avg Return: 0.306, Regret: 0.4930, Entropy: 0.7033 +[2026-01-29T21:30:48.160186Z] Loop 241: Loss: 1.60e-02, Avg Return: 0.308, Regret: 0.4929, Entropy: 0.7032 +[2026-01-29T21:30:49.366220Z] Loop 242: Loss: 1.60e-02, Avg Return: 0.305, Regret: 0.4928, Entropy: 0.7033 +[2026-01-29T21:30:50.568669Z] Loop 243: Loss: 1.57e-02, Avg Return: 0.308, Regret: 0.4928, Entropy: 0.7033 +[2026-01-29T21:30:51.773147Z] Loop 244: Loss: 1.74e-02, Avg Return: 0.309, Regret: 0.4928, Entropy: 0.7031 +[2026-01-29T21:30:52.986618Z] Loop 245: Loss: 1.59e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.7026 +[2026-01-29T21:30:54.200842Z] Loop 246: Loss: 1.74e-02, Avg Return: 0.313, Regret: 0.4930, Entropy: 0.7020 +[2026-01-29T21:30:55.413720Z] Loop 247: Loss: 1.73e-02, Avg Return: 0.309, Regret: 0.4930, Entropy: 0.7017 +[2026-01-29T21:30:56.619365Z] Loop 248: Loss: 1.58e-02, Avg Return: 0.312, Regret: 0.4930, Entropy: 0.7017 +[2026-01-29T21:30:57.825663Z] Loop 249: Loss: 1.70e-02, Avg Return: 0.311, Regret: 0.4930, Entropy: 0.7016 +[2026-01-29T21:30:59.034591Z] Loop 250: Loss: 1.60e-02, Avg Return: 0.314, Regret: 0.4929, Entropy: 0.7018 +[2026-01-29T21:31:00.194898Z] Loop 251: Loss: 1.72e-02, Avg Return: 0.310, Regret: 0.4929, Entropy: 0.7020 +[2026-01-29T21:31:01.398197Z] Loop 252: Loss: 1.70e-02, Avg Return: 0.313, Regret: 0.4928, Entropy: 0.7022 +[2026-01-29T21:31:02.558202Z] Loop 253: Loss: 1.80e-02, Avg Return: 0.315, Regret: 0.4928, Entropy: 0.7021 +[2026-01-29T21:31:03.784660Z] Loop 254: Loss: 1.70e-02, Avg Return: 0.317, Regret: 0.4928, Entropy: 0.7018 +[2026-01-29T21:31:04.949964Z] Loop 255: Loss: 1.66e-02, Avg Return: 0.313, Regret: 0.4928, Entropy: 0.7013 +[2026-01-29T21:31:06.157908Z] Loop 256: Loss: 1.70e-02, Avg Return: 0.308, Regret: 0.4931, Entropy: 0.7007 +[2026-01-29T21:31:07.325273Z] Loop 257: Loss: 1.61e-02, Avg Return: 0.315, Regret: 0.4931, Entropy: 0.7002 +[2026-01-29T21:31:08.530494Z] Loop 258: Loss: 1.65e-02, Avg Return: 0.305, Regret: 0.4930, Entropy: 0.7003 +[2026-01-29T21:31:09.689625Z] Loop 259: Loss: 1.59e-02, Avg Return: 0.307, Regret: 0.4930, Entropy: 0.7005 +[2026-01-29T21:31:10.891889Z] Loop 260: Loss: 1.72e-02, Avg Return: 0.310, Regret: 0.4929, Entropy: 0.7007 +[2026-01-29T21:31:12.056116Z] Loop 261: Loss: 1.65e-02, Avg Return: 0.310, Regret: 0.4929, Entropy: 0.7007 +[2026-01-29T21:31:13.264146Z] Loop 262: Loss: 1.75e-02, Avg Return: 0.311, Regret: 0.4928, Entropy: 0.7008 +[2026-01-29T21:31:14.423734Z] Loop 263: Loss: 1.68e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.7007 +[2026-01-29T21:31:15.625649Z] Loop 264: Loss: 1.65e-02, Avg Return: 0.308, Regret: 0.4927, Entropy: 0.7006 +[2026-01-29T21:31:16.788419Z] Loop 265: Loss: 1.64e-02, Avg Return: 0.313, Regret: 0.4927, Entropy: 0.7005 +[2026-01-29T21:31:18.000584Z] Loop 266: Loss: 1.57e-02, Avg Return: 0.305, Regret: 0.4927, Entropy: 0.7004 +[2026-01-29T21:31:19.159969Z] Loop 267: Loss: 1.65e-02, Avg Return: 0.309, Regret: 0.4927, Entropy: 0.7003 +[2026-01-29T21:31:20.364643Z] Loop 268: Loss: 1.75e-02, Avg Return: 0.311, Regret: 0.4927, Entropy: 0.7002 +[2026-01-29T21:31:21.523281Z] Loop 269: Loss: 1.63e-02, Avg Return: 0.314, Regret: 0.4927, Entropy: 0.7001 +[2026-01-29T21:31:22.724436Z] Loop 270: Loss: 1.70e-02, Avg Return: 0.313, Regret: 0.4927, Entropy: 0.7000 +[2026-01-29T21:31:23.884289Z] Loop 271: Loss: 1.73e-02, Avg Return: 0.313, Regret: 0.4927, Entropy: 0.6998 +[2026-01-29T21:31:25.086713Z] Loop 272: Loss: 1.80e-02, Avg Return: 0.314, Regret: 0.4927, Entropy: 0.6997 +[2026-01-29T21:31:26.245826Z] Loop 273: Loss: 1.70e-02, Avg Return: 0.312, Regret: 0.4927, Entropy: 0.6994 +[2026-01-29T21:31:27.456640Z] Loop 274: Loss: 1.72e-02, Avg Return: 0.311, Regret: 0.4928, Entropy: 0.6992 +[2026-01-29T21:31:28.616527Z] Loop 275: Loss: 1.54e-02, Avg Return: 0.303, Regret: 0.4928, Entropy: 0.6990 +[2026-01-29T21:31:29.837547Z] Loop 276: Loss: 1.63e-02, Avg Return: 0.314, Regret: 0.4929, Entropy: 0.6987 +[2026-01-29T21:31:30.996658Z] Loop 277: Loss: 1.65e-02, Avg Return: 0.305, Regret: 0.4929, Entropy: 0.6987 +[2026-01-29T21:31:32.199258Z] Loop 278: Loss: 1.72e-02, Avg Return: 0.313, Regret: 0.4929, Entropy: 0.6987 +[2026-01-29T21:31:33.359048Z] Loop 279: Loss: 1.73e-02, Avg Return: 0.313, Regret: 0.4929, Entropy: 0.6989 +[2026-01-29T21:31:34.565075Z] Loop 280: Loss: 1.67e-02, Avg Return: 0.311, Regret: 0.4927, Entropy: 0.6992 +[2026-01-29T21:31:35.724808Z] Loop 281: Loss: 1.66e-02, Avg Return: 0.308, Regret: 0.4927, Entropy: 0.6994 +[2026-01-29T21:31:36.934280Z] Loop 282: Loss: 1.66e-02, Avg Return: 0.313, Regret: 0.4927, Entropy: 0.6994 +[2026-01-29T21:31:38.094462Z] Loop 283: Loss: 1.61e-02, Avg Return: 0.306, Regret: 0.4927, Entropy: 0.6991 +[2026-01-29T21:31:39.298047Z] Loop 284: Loss: 1.63e-02, Avg Return: 0.305, Regret: 0.4930, Entropy: 0.6986 +[2026-01-29T21:31:40.457977Z] Loop 285: Loss: 1.68e-02, Avg Return: 0.312, Regret: 0.4930, Entropy: 0.6979 +[2026-01-29T21:31:41.662613Z] Loop 286: Loss: 1.54e-02, Avg Return: 0.313, Regret: 0.4934, Entropy: 0.6974 +[2026-01-29T21:31:42.821995Z] Loop 287: Loss: 1.72e-02, Avg Return: 0.308, Regret: 0.4934, Entropy: 0.6977 +[2026-01-29T21:31:44.026134Z] Loop 288: Loss: 1.70e-02, Avg Return: 0.315, Regret: 0.4931, Entropy: 0.6984 +[2026-01-29T21:31:45.186151Z] Loop 289: Loss: 1.80e-02, Avg Return: 0.314, Regret: 0.4931, Entropy: 0.6990 +[2026-01-29T21:31:46.388020Z] Loop 290: Loss: 1.75e-02, Avg Return: 0.308, Regret: 0.4927, Entropy: 0.6996 +[2026-01-29T21:31:47.546208Z] Loop 291: Loss: 1.83e-02, Avg Return: 0.318, Regret: 0.4927, Entropy: 0.6995 +[2026-01-29T21:31:48.748024Z] Loop 292: Loss: 1.75e-02, Avg Return: 0.310, Regret: 0.4929, Entropy: 0.6989 +[2026-01-29T21:31:49.907886Z] Loop 293: Loss: 1.62e-02, Avg Return: 0.314, Regret: 0.4929, Entropy: 0.6982 +[2026-01-29T21:31:51.111042Z] Loop 294: Loss: 1.67e-02, Avg Return: 0.308, Regret: 0.4933, Entropy: 0.6973 +[2026-01-29T21:31:52.269762Z] Loop 295: Loss: 1.73e-02, Avg Return: 0.312, Regret: 0.4933, Entropy: 0.6964 +[2026-01-29T21:31:53.472158Z] Loop 296: Loss: 1.70e-02, Avg Return: 0.308, Regret: 0.4936, Entropy: 0.6964 +[2026-01-29T21:31:54.630163Z] Loop 297: Loss: 1.63e-02, Avg Return: 0.304, Regret: 0.4936, Entropy: 0.6970 +[2026-01-29T21:31:55.833158Z] Loop 298: Loss: 1.59e-02, Avg Return: 0.308, Regret: 0.4932, Entropy: 0.6979 +[2026-01-29T21:31:56.997764Z] Loop 299: Loss: 1.69e-02, Avg Return: 0.318, Regret: 0.4932, Entropy: 0.6984 +[2026-01-29T21:31:58.206114Z] Loop 300: Loss: 1.63e-02, Avg Return: 0.309, Regret: 0.4929, Entropy: 0.6989 +[2026-01-29T21:31:59.366580Z] Loop 301: Loss: 1.61e-02, Avg Return: 0.305, Regret: 0.4929, Entropy: 0.6995 +[2026-01-29T21:32:00.571575Z] Loop 302: Loss: 1.64e-02, Avg Return: 0.301, Regret: 0.4927, Entropy: 0.6998 +[2026-01-29T21:32:01.729994Z] Loop 303: Loss: 1.58e-02, Avg Return: 0.309, Regret: 0.4927, Entropy: 0.6998 +[2026-01-29T21:32:02.940502Z] Loop 304: Loss: 1.67e-02, Avg Return: 0.309, Regret: 0.4928, Entropy: 0.6995 +[2026-01-29T21:32:04.099819Z] Loop 305: Loss: 1.60e-02, Avg Return: 0.306, Regret: 0.4928, Entropy: 0.6992 +[2026-01-29T21:32:05.304616Z] Loop 306: Loss: 1.72e-02, Avg Return: 0.312, Regret: 0.4930, Entropy: 0.6988 +[2026-01-29T21:32:06.463944Z] Loop 307: Loss: 1.64e-02, Avg Return: 0.310, Regret: 0.4930, Entropy: 0.6986 +[2026-01-29T21:32:07.668005Z] Loop 308: Loss: 1.67e-02, Avg Return: 0.306, Regret: 0.4932, Entropy: 0.6983 +[2026-01-29T21:32:08.827139Z] Loop 309: Loss: 1.65e-02, Avg Return: 0.313, Regret: 0.4932, Entropy: 0.6976 +[2026-01-29T21:32:10.029298Z] Loop 310: Loss: 1.81e-02, Avg Return: 0.313, Regret: 0.4935, Entropy: 0.6972 +[2026-01-29T21:32:11.190053Z] Loop 311: Loss: 1.64e-02, Avg Return: 0.309, Regret: 0.4935, Entropy: 0.6973 +[2026-01-29T21:32:12.394267Z] Loop 312: Loss: 1.67e-02, Avg Return: 0.317, Regret: 0.4933, Entropy: 0.6976 +[2026-01-29T21:32:13.554121Z] Loop 313: Loss: 1.67e-02, Avg Return: 0.309, Regret: 0.4933, Entropy: 0.6985 +[2026-01-29T21:32:14.757910Z] Loop 314: Loss: 1.74e-02, Avg Return: 0.307, Regret: 0.4928, Entropy: 0.6990 +[2026-01-29T21:32:15.923912Z] Loop 315: Loss: 1.65e-02, Avg Return: 0.305, Regret: 0.4928, Entropy: 0.6993 +[2026-01-29T21:32:17.127706Z] Loop 316: Loss: 1.67e-02, Avg Return: 0.308, Regret: 0.4927, Entropy: 0.6991 +[2026-01-29T21:32:18.287361Z] Loop 317: Loss: 1.58e-02, Avg Return: 0.313, Regret: 0.4927, Entropy: 0.6985 +[2026-01-29T21:32:19.493758Z] Loop 318: Loss: 1.66e-02, Avg Return: 0.305, Regret: 0.4930, Entropy: 0.6978 +[2026-01-29T21:32:20.656553Z] Loop 319: Loss: 1.59e-02, Avg Return: 0.308, Regret: 0.4930, Entropy: 0.6967 +[2026-01-29T21:32:21.866241Z] Loop 320: Loss: 1.71e-02, Avg Return: 0.308, Regret: 0.4933, Entropy: 0.6965 +[2026-01-29T21:32:23.025947Z] Loop 321: Loss: 1.72e-02, Avg Return: 0.312, Regret: 0.4933, Entropy: 0.6971 +[2026-01-29T21:32:24.227275Z] Loop 322: Loss: 1.65e-02, Avg Return: 0.311, Regret: 0.4928, Entropy: 0.6981 +[2026-01-29T21:32:25.388293Z] Loop 323: Loss: 1.61e-02, Avg Return: 0.301, Regret: 0.4928, Entropy: 0.6987 +[2026-01-29T21:32:26.599672Z] Loop 324: Loss: 1.75e-02, Avg Return: 0.312, Regret: 0.4927, Entropy: 0.6988 +[2026-01-29T21:32:27.759966Z] Loop 325: Loss: 1.67e-02, Avg Return: 0.310, Regret: 0.4927, Entropy: 0.6986 +[2026-01-29T21:32:28.963720Z] Loop 326: Loss: 1.61e-02, Avg Return: 0.307, Regret: 0.4929, Entropy: 0.6982 +[2026-01-29T21:32:30.123663Z] Loop 327: Loss: 1.66e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.6981 +[2026-01-29T21:32:31.333470Z] Loop 328: Loss: 1.70e-02, Avg Return: 0.317, Regret: 0.4929, Entropy: 0.6980 +[2026-01-29T21:32:32.496703Z] Loop 329: Loss: 1.54e-02, Avg Return: 0.313, Regret: 0.4929, Entropy: 0.6979 +[2026-01-29T21:32:33.710692Z] Loop 330: Loss: 1.73e-02, Avg Return: 0.318, Regret: 0.4929, Entropy: 0.6981 +[2026-01-29T21:32:34.873529Z] Loop 331: Loss: 1.70e-02, Avg Return: 0.309, Regret: 0.4929, Entropy: 0.6984 +[2026-01-29T21:32:36.079734Z] Loop 332: Loss: 1.65e-02, Avg Return: 0.311, Regret: 0.4927, Entropy: 0.6986 +[2026-01-29T21:32:37.237881Z] Loop 333: Loss: 1.74e-02, Avg Return: 0.311, Regret: 0.4927, Entropy: 0.6988 +[2026-01-29T21:32:38.438327Z] Loop 334: Loss: 1.69e-02, Avg Return: 0.309, Regret: 0.4927, Entropy: 0.6986 +[2026-01-29T21:32:39.598380Z] Loop 335: Loss: 1.62e-02, Avg Return: 0.308, Regret: 0.4927, Entropy: 0.6981 +[2026-01-29T21:32:40.804419Z] Loop 336: Loss: 1.74e-02, Avg Return: 0.312, Regret: 0.4929, Entropy: 0.6977 +[2026-01-29T21:32:41.967307Z] Loop 337: Loss: 1.74e-02, Avg Return: 0.323, Regret: 0.4929, Entropy: 0.6973 +[2026-01-29T21:32:43.169928Z] Loop 338: Loss: 1.79e-02, Avg Return: 0.319, Regret: 0.4931, Entropy: 0.6972 +[2026-01-29T21:32:44.328519Z] Loop 339: Loss: 1.63e-02, Avg Return: 0.311, Regret: 0.4931, Entropy: 0.6978 +[2026-01-29T21:32:45.530684Z] Loop 340: Loss: 1.63e-02, Avg Return: 0.308, Regret: 0.4928, Entropy: 0.6983 +[2026-01-29T21:32:46.690487Z] Loop 341: Loss: 1.67e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.6988 +[2026-01-29T21:32:47.896415Z] Loop 342: Loss: 1.71e-02, Avg Return: 0.316, Regret: 0.4926, Entropy: 0.6990 +[2026-01-29T21:32:49.058233Z] Loop 343: Loss: 1.54e-02, Avg Return: 0.306, Regret: 0.4926, Entropy: 0.6989 +[2026-01-29T21:32:50.263272Z] Loop 344: Loss: 1.67e-02, Avg Return: 0.300, Regret: 0.4927, Entropy: 0.6988 +[2026-01-29T21:32:51.423611Z] Loop 345: Loss: 1.75e-02, Avg Return: 0.313, Regret: 0.4927, Entropy: 0.6987 +[2026-01-29T21:32:52.626070Z] Loop 346: Loss: 1.59e-02, Avg Return: 0.308, Regret: 0.4928, Entropy: 0.6987 +[2026-01-29T21:32:53.789114Z] Loop 347: Loss: 1.56e-02, Avg Return: 0.307, Regret: 0.4928, Entropy: 0.6987 +[2026-01-29T21:32:54.991289Z] Loop 348: Loss: 1.57e-02, Avg Return: 0.308, Regret: 0.4927, Entropy: 0.6987 +[2026-01-29T21:32:56.149692Z] Loop 349: Loss: 1.63e-02, Avg Return: 0.312, Regret: 0.4927, Entropy: 0.6988 +[2026-01-29T21:32:57.352101Z] Loop 350: Loss: 1.59e-02, Avg Return: 0.303, Regret: 0.4926, Entropy: 0.6987 +[2026-01-29T21:32:58.511379Z] Loop 351: Loss: 1.63e-02, Avg Return: 0.314, Regret: 0.4926, Entropy: 0.6987 +[2026-01-29T21:32:59.715358Z] Loop 352: Loss: 1.58e-02, Avg Return: 0.307, Regret: 0.4926, Entropy: 0.6986 +[2026-01-29T21:33:00.878855Z] Loop 353: Loss: 1.66e-02, Avg Return: 0.315, Regret: 0.4926, Entropy: 0.6984 +[2026-01-29T21:33:02.092769Z] Loop 354: Loss: 1.67e-02, Avg Return: 0.311, Regret: 0.4927, Entropy: 0.6982 +[2026-01-29T21:33:03.260046Z] Loop 355: Loss: 1.62e-02, Avg Return: 0.306, Regret: 0.4927, Entropy: 0.6979 +[2026-01-29T21:33:04.466718Z] Loop 356: Loss: 1.65e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.6977 +[2026-01-29T21:33:05.629758Z] Loop 357: Loss: 1.67e-02, Avg Return: 0.314, Regret: 0.4928, Entropy: 0.6974 +[2026-01-29T21:33:06.838402Z] Loop 358: Loss: 1.64e-02, Avg Return: 0.309, Regret: 0.4928, Entropy: 0.6976 +[2026-01-29T21:33:07.998941Z] Loop 359: Loss: 1.67e-02, Avg Return: 0.307, Regret: 0.4928, Entropy: 0.6977 +[2026-01-29T21:33:09.199310Z] Loop 360: Loss: 1.69e-02, Avg Return: 0.311, Regret: 0.4927, Entropy: 0.6979 +[2026-01-29T21:33:10.357265Z] Loop 361: Loss: 1.82e-02, Avg Return: 0.312, Regret: 0.4927, Entropy: 0.6981 +[2026-01-29T21:33:11.558590Z] Loop 362: Loss: 1.73e-02, Avg Return: 0.312, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:12.721671Z] Loop 363: Loss: 1.58e-02, Avg Return: 0.306, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:13.932805Z] Loop 364: Loss: 1.71e-02, Avg Return: 0.314, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:15.094788Z] Loop 365: Loss: 1.74e-02, Avg Return: 0.315, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:16.306545Z] Loop 366: Loss: 1.72e-02, Avg Return: 0.315, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:17.469057Z] Loop 367: Loss: 1.67e-02, Avg Return: 0.310, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:18.674164Z] Loop 368: Loss: 1.70e-02, Avg Return: 0.317, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:19.838047Z] Loop 369: Loss: 1.60e-02, Avg Return: 0.309, Regret: 0.4926, Entropy: 0.6982 +[2026-01-29T21:33:21.042105Z] Loop 370: Loss: 1.67e-02, Avg Return: 0.311, Regret: 0.4926, Entropy: 0.6982 +[2026-01-29T21:33:22.201872Z] Loop 371: Loss: 1.73e-02, Avg Return: 0.314, Regret: 0.4926, Entropy: 0.6981 +[2026-01-29T21:33:23.407005Z] Loop 372: Loss: 1.61e-02, Avg Return: 0.311, Regret: 0.4927, Entropy: 0.6981 +[2026-01-29T21:33:24.568498Z] Loop 373: Loss: 1.70e-02, Avg Return: 0.309, Regret: 0.4927, Entropy: 0.6982 +[2026-01-29T21:33:25.778341Z] Loop 374: Loss: 1.72e-02, Avg Return: 0.312, Regret: 0.4926, Entropy: 0.6982 +[2026-01-29T21:33:26.938143Z] Loop 375: Loss: 1.76e-02, Avg Return: 0.317, Regret: 0.4926, Entropy: 0.6982 +[2026-01-29T21:33:28.143231Z] Loop 376: Loss: 1.66e-02, Avg Return: 0.310, Regret: 0.4926, Entropy: 0.6982 +[2026-01-29T21:33:29.302888Z] Loop 377: Loss: 1.75e-02, Avg Return: 0.309, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:30.506089Z] Loop 378: Loss: 1.66e-02, Avg Return: 0.308, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:31.666774Z] Loop 379: Loss: 1.62e-02, Avg Return: 0.311, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:32.873616Z] Loop 380: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:34.035362Z] Loop 381: Loss: 1.70e-02, Avg Return: 0.312, Regret: 0.4926, Entropy: 0.6983 +[2026-01-29T21:33:35.245229Z] Loop 382: Loss: 1.67e-02, Avg Return: 0.311, Regret: 0.4927, Entropy: 0.6983 +[2026-01-29T21:33:36.406985Z] Loop 383: Loss: 1.55e-02, Avg Return: 0.310, Regret: 0.4927, Entropy: 0.6982 +[2026-01-29T21:33:37.620006Z] Loop 384: Loss: 1.76e-02, Avg Return: 0.310, Regret: 0.4927, Entropy: 0.6981 +[2026-01-29T21:33:38.783690Z] Loop 385: Loss: 1.81e-02, Avg Return: 0.317, Regret: 0.4927, Entropy: 0.6978 +[2026-01-29T21:33:39.987645Z] Loop 386: Loss: 1.68e-02, Avg Return: 0.305, Regret: 0.4928, Entropy: 0.6979 +[2026-01-29T21:33:41.146939Z] Loop 387: Loss: 1.59e-02, Avg Return: 0.309, Regret: 0.4928, Entropy: 0.6980 +[2026-01-29T21:33:42.350417Z] Loop 388: Loss: 1.62e-02, Avg Return: 0.306, Regret: 0.4927, Entropy: 0.6982 +[2026-01-29T21:33:43.514784Z] Loop 389: Loss: 1.60e-02, Avg Return: 0.314, Regret: 0.4927, Entropy: 0.6983 +[2026-01-29T21:33:44.721760Z] Loop 390: Loss: 1.66e-02, Avg Return: 0.307, Regret: 0.4927, Entropy: 0.6985 +[2026-01-29T21:33:45.881027Z] Loop 391: Loss: 1.69e-02, Avg Return: 0.311, Regret: 0.4927, Entropy: 0.6986 +[2026-01-29T21:33:47.080833Z] Loop 392: Loss: 1.79e-02, Avg Return: 0.318, Regret: 0.4926, Entropy: 0.6986 +[2026-01-29T21:33:48.239915Z] Loop 393: Loss: 1.71e-02, Avg Return: 0.315, Regret: 0.4926, Entropy: 0.6986 +[2026-01-29T21:33:49.446808Z] Loop 394: Loss: 1.68e-02, Avg Return: 0.315, Regret: 0.4927, Entropy: 0.6985 +[2026-01-29T21:33:50.610429Z] Loop 395: Loss: 1.73e-02, Avg Return: 0.313, Regret: 0.4927, Entropy: 0.6982 +[2026-01-29T21:33:51.813108Z] Loop 396: Loss: 1.51e-02, Avg Return: 0.309, Regret: 0.4928, Entropy: 0.6979 +[2026-01-29T21:33:52.972214Z] Loop 397: Loss: 1.71e-02, Avg Return: 0.313, Regret: 0.4928, Entropy: 0.6978 +[2026-01-29T21:33:54.173074Z] Loop 398: Loss: 1.68e-02, Avg Return: 0.313, Regret: 0.4928, Entropy: 0.6978 +[2026-01-29T21:33:55.332641Z] Loop 399: Loss: 1.57e-02, Avg Return: 0.308, Regret: 0.4928, Entropy: 0.6978 +[2026-01-29T21:33:56.532319Z] Loop 400: Loss: 1.71e-02, Avg Return: 0.312, Regret: 0.4928, Entropy: 0.6980 +[2026-01-29T21:33:57.693835Z] Loop 401: Loss: 1.70e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.6980 +[2026-01-29T21:33:58.901836Z] Loop 402: Loss: 1.66e-02, Avg Return: 0.306, Regret: 0.4927, Entropy: 0.6980 +[2026-01-29T21:34:00.060513Z] Loop 403: Loss: 1.73e-02, Avg Return: 0.315, Regret: 0.4927, Entropy: 0.6981 +[2026-01-29T21:34:01.264608Z] Loop 404: Loss: 1.61e-02, Avg Return: 0.310, Regret: 0.4927, Entropy: 0.6979 +[2026-01-29T21:34:02.424741Z] Loop 405: Loss: 1.54e-02, Avg Return: 0.302, Regret: 0.4927, Entropy: 0.6977 +[2026-01-29T21:34:03.625880Z] Loop 406: Loss: 1.67e-02, Avg Return: 0.313, Regret: 0.4928, Entropy: 0.6976 +[2026-01-29T21:34:04.785609Z] Loop 407: Loss: 1.73e-02, Avg Return: 0.312, Regret: 0.4928, Entropy: 0.6977 +[2026-01-29T21:34:05.986192Z] Loop 408: Loss: 1.66e-02, Avg Return: 0.310, Regret: 0.4927, Entropy: 0.6977 +[2026-01-29T21:34:07.146635Z] Loop 409: Loss: 1.76e-02, Avg Return: 0.315, Regret: 0.4927, Entropy: 0.6978 +[2026-01-29T21:34:08.347446Z] Loop 410: Loss: 1.72e-02, Avg Return: 0.315, Regret: 0.4926, Entropy: 0.6981 +[2026-01-29T21:34:09.509364Z] Loop 411: Loss: 1.59e-02, Avg Return: 0.305, Regret: 0.4926, Entropy: 0.6981 +[2026-01-29T21:34:10.713077Z] Loop 412: Loss: 1.69e-02, Avg Return: 0.314, Regret: 0.4926, Entropy: 0.6980 +[2026-01-29T21:34:11.872693Z] Loop 413: Loss: 1.75e-02, Avg Return: 0.312, Regret: 0.4926, Entropy: 0.6976 +[2026-01-29T21:34:13.073300Z] Loop 414: Loss: 1.69e-02, Avg Return: 0.313, Regret: 0.4929, Entropy: 0.6971 +[2026-01-29T21:34:14.232683Z] Loop 415: Loss: 1.73e-02, Avg Return: 0.313, Regret: 0.4929, Entropy: 0.6963 +[2026-01-29T21:34:15.433931Z] Loop 416: Loss: 1.65e-02, Avg Return: 0.311, Regret: 0.4933, Entropy: 0.6957 +[2026-01-29T21:34:16.593654Z] Loop 417: Loss: 1.56e-02, Avg Return: 0.304, Regret: 0.4933, Entropy: 0.6960 +[2026-01-29T21:34:17.792791Z] Loop 418: Loss: 1.67e-02, Avg Return: 0.307, Regret: 0.4931, Entropy: 0.6962 +[2026-01-29T21:34:18.951587Z] Loop 419: Loss: 1.66e-02, Avg Return: 0.314, Regret: 0.4931, Entropy: 0.6968 +[2026-01-29T21:34:20.152320Z] Loop 420: Loss: 1.53e-02, Avg Return: 0.302, Regret: 0.4927, Entropy: 0.6974 +[2026-01-29T21:34:21.312359Z] Loop 421: Loss: 1.69e-02, Avg Return: 0.316, Regret: 0.4927, Entropy: 0.6975 +[2026-01-29T21:34:22.514996Z] Loop 422: Loss: 1.71e-02, Avg Return: 0.312, Regret: 0.4926, Entropy: 0.6974 +[2026-01-29T21:34:23.678141Z] Loop 423: Loss: 1.60e-02, Avg Return: 0.313, Regret: 0.4926, Entropy: 0.6971 +[2026-01-29T21:34:24.882643Z] Loop 424: Loss: 1.61e-02, Avg Return: 0.309, Regret: 0.4928, Entropy: 0.6963 +[2026-01-29T21:34:26.045582Z] Loop 425: Loss: 1.66e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.6956 +[2026-01-29T21:34:27.248153Z] Loop 426: Loss: 1.63e-02, Avg Return: 0.309, Regret: 0.4932, Entropy: 0.6949 +[2026-01-29T21:34:28.409837Z] Loop 427: Loss: 1.66e-02, Avg Return: 0.311, Regret: 0.4932, Entropy: 0.6949 +[2026-01-29T21:34:29.612089Z] Loop 428: Loss: 1.67e-02, Avg Return: 0.312, Regret: 0.4930, Entropy: 0.6955 +[2026-01-29T21:34:30.771969Z] Loop 429: Loss: 1.71e-02, Avg Return: 0.311, Regret: 0.4930, Entropy: 0.6962 +[2026-01-29T21:34:31.973026Z] Loop 430: Loss: 1.79e-02, Avg Return: 0.310, Regret: 0.4926, Entropy: 0.6968 +[2026-01-29T21:34:33.133189Z] Loop 431: Loss: 1.67e-02, Avg Return: 0.308, Regret: 0.4926, Entropy: 0.6970 +[2026-01-29T21:34:34.333794Z] Loop 432: Loss: 1.70e-02, Avg Return: 0.314, Regret: 0.4926, Entropy: 0.6968 +[2026-01-29T21:34:35.494691Z] Loop 433: Loss: 1.61e-02, Avg Return: 0.307, Regret: 0.4926, Entropy: 0.6961 +[2026-01-29T21:34:36.696180Z] Loop 434: Loss: 1.75e-02, Avg Return: 0.314, Regret: 0.4930, Entropy: 0.6954 +[2026-01-29T21:34:37.857152Z] Loop 435: Loss: 1.73e-02, Avg Return: 0.309, Regret: 0.4930, Entropy: 0.6949 +[2026-01-29T21:34:39.059380Z] Loop 436: Loss: 1.56e-02, Avg Return: 0.308, Regret: 0.4931, Entropy: 0.6950 +[2026-01-29T21:34:40.225214Z] Loop 437: Loss: 1.55e-02, Avg Return: 0.303, Regret: 0.4931, Entropy: 0.6956 +[2026-01-29T21:34:41.432662Z] Loop 438: Loss: 1.80e-02, Avg Return: 0.310, Regret: 0.4927, Entropy: 0.6963 +[2026-01-29T21:34:42.597566Z] Loop 439: Loss: 1.76e-02, Avg Return: 0.310, Regret: 0.4927, Entropy: 0.6966 +[2026-01-29T21:34:43.801837Z] Loop 440: Loss: 1.62e-02, Avg Return: 0.309, Regret: 0.4926, Entropy: 0.6966 +[2026-01-29T21:34:44.966443Z] Loop 441: Loss: 1.67e-02, Avg Return: 0.315, Regret: 0.4926, Entropy: 0.6966 +[2026-01-29T21:34:46.170022Z] Loop 442: Loss: 1.67e-02, Avg Return: 0.317, Regret: 0.4925, Entropy: 0.6966 +[2026-01-29T21:34:47.331098Z] Loop 443: Loss: 1.61e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6965 +[2026-01-29T21:34:48.531467Z] Loop 444: Loss: 1.61e-02, Avg Return: 0.308, Regret: 0.4925, Entropy: 0.6965 +[2026-01-29T21:34:49.692568Z] Loop 445: Loss: 1.69e-02, Avg Return: 0.312, Regret: 0.4925, Entropy: 0.6965 +[2026-01-29T21:34:50.889337Z] Loop 446: Loss: 1.70e-02, Avg Return: 0.311, Regret: 0.4925, Entropy: 0.6965 +[2026-01-29T21:34:52.048507Z] Loop 447: Loss: 1.78e-02, Avg Return: 0.316, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:34:53.246879Z] Loop 448: Loss: 1.72e-02, Avg Return: 0.312, Regret: 0.4926, Entropy: 0.6964 +[2026-01-29T21:34:54.405099Z] Loop 449: Loss: 1.66e-02, Avg Return: 0.315, Regret: 0.4926, Entropy: 0.6965 +[2026-01-29T21:34:55.604419Z] Loop 450: Loss: 1.73e-02, Avg Return: 0.308, Regret: 0.4926, Entropy: 0.6962 +[2026-01-29T21:34:56.764258Z] Loop 451: Loss: 1.72e-02, Avg Return: 0.310, Regret: 0.4926, Entropy: 0.6958 +[2026-01-29T21:34:57.961033Z] Loop 452: Loss: 1.74e-02, Avg Return: 0.313, Regret: 0.4929, Entropy: 0.6953 +[2026-01-29T21:34:59.119894Z] Loop 453: Loss: 1.76e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.6951 +[2026-01-29T21:35:00.321124Z] Loop 454: Loss: 1.65e-02, Avg Return: 0.307, Regret: 0.4928, Entropy: 0.6954 +[2026-01-29T21:35:01.484800Z] Loop 455: Loss: 1.65e-02, Avg Return: 0.313, Regret: 0.4928, Entropy: 0.6962 +[2026-01-29T21:35:02.683058Z] Loop 456: Loss: 1.82e-02, Avg Return: 0.315, Regret: 0.4925, Entropy: 0.6962 +[2026-01-29T21:35:03.844724Z] Loop 457: Loss: 1.63e-02, Avg Return: 0.312, Regret: 0.4925, Entropy: 0.6957 +[2026-01-29T21:35:05.044140Z] Loop 458: Loss: 1.66e-02, Avg Return: 0.309, Regret: 0.4929, Entropy: 0.6950 +[2026-01-29T21:35:06.207987Z] Loop 459: Loss: 1.66e-02, Avg Return: 0.314, Regret: 0.4929, Entropy: 0.6943 +[2026-01-29T21:35:07.420231Z] Loop 460: Loss: 1.66e-02, Avg Return: 0.315, Regret: 0.4931, Entropy: 0.6940 +[2026-01-29T21:35:08.581628Z] Loop 461: Loss: 1.72e-02, Avg Return: 0.314, Regret: 0.4931, Entropy: 0.6942 +[2026-01-29T21:35:09.789347Z] Loop 462: Loss: 1.74e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.6949 +[2026-01-29T21:35:10.948816Z] Loop 463: Loss: 1.57e-02, Avg Return: 0.303, Regret: 0.4929, Entropy: 0.6958 +[2026-01-29T21:35:12.159451Z] Loop 464: Loss: 1.69e-02, Avg Return: 0.314, Regret: 0.4926, Entropy: 0.6961 +[2026-01-29T21:35:13.331153Z] Loop 465: Loss: 1.68e-02, Avg Return: 0.312, Regret: 0.4926, Entropy: 0.6963 +[2026-01-29T21:35:14.542982Z] Loop 466: Loss: 1.62e-02, Avg Return: 0.311, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:35:15.707963Z] Loop 467: Loss: 1.64e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:35:16.917784Z] Loop 468: Loss: 1.67e-02, Avg Return: 0.312, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:35:18.077685Z] Loop 469: Loss: 1.62e-02, Avg Return: 0.312, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:35:19.277943Z] Loop 470: Loss: 1.64e-02, Avg Return: 0.311, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:35:20.438377Z] Loop 471: Loss: 1.76e-02, Avg Return: 0.314, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:21.639330Z] Loop 472: Loss: 1.65e-02, Avg Return: 0.313, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:35:22.804993Z] Loop 473: Loss: 1.69e-02, Avg Return: 0.313, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:35:24.014875Z] Loop 474: Loss: 1.73e-02, Avg Return: 0.313, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:25.176174Z] Loop 475: Loss: 1.61e-02, Avg Return: 0.313, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:26.376274Z] Loop 476: Loss: 1.63e-02, Avg Return: 0.314, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:27.537721Z] Loop 477: Loss: 1.64e-02, Avg Return: 0.313, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:28.739295Z] Loop 478: Loss: 1.62e-02, Avg Return: 0.313, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:29.899777Z] Loop 479: Loss: 1.51e-02, Avg Return: 0.308, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:31.108210Z] Loop 480: Loss: 1.60e-02, Avg Return: 0.310, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:32.274149Z] Loop 481: Loss: 1.56e-02, Avg Return: 0.313, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:33.478991Z] Loop 482: Loss: 1.63e-02, Avg Return: 0.311, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:34.638995Z] Loop 483: Loss: 1.75e-02, Avg Return: 0.310, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:35.842318Z] Loop 484: Loss: 1.63e-02, Avg Return: 0.317, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:35:37.004353Z] Loop 485: Loss: 1.63e-02, Avg Return: 0.317, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:35:38.207490Z] Loop 486: Loss: 1.55e-02, Avg Return: 0.311, Regret: 0.4926, Entropy: 0.6962 +[2026-01-29T21:35:39.368247Z] Loop 487: Loss: 1.65e-02, Avg Return: 0.317, Regret: 0.4926, Entropy: 0.6961 +[2026-01-29T21:35:40.568264Z] Loop 488: Loss: 1.65e-02, Avg Return: 0.316, Regret: 0.4926, Entropy: 0.6962 +[2026-01-29T21:35:41.727039Z] Loop 489: Loss: 1.61e-02, Avg Return: 0.310, Regret: 0.4926, Entropy: 0.6964 +[2026-01-29T21:35:42.927139Z] Loop 490: Loss: 1.53e-02, Avg Return: 0.305, Regret: 0.4926, Entropy: 0.6963 +[2026-01-29T21:35:44.089652Z] Loop 491: Loss: 1.68e-02, Avg Return: 0.306, Regret: 0.4926, Entropy: 0.6962 +[2026-01-29T21:35:45.291315Z] Loop 492: Loss: 1.70e-02, Avg Return: 0.309, Regret: 0.4927, Entropy: 0.6960 +[2026-01-29T21:35:46.455828Z] Loop 493: Loss: 1.74e-02, Avg Return: 0.305, Regret: 0.4927, Entropy: 0.6958 +[2026-01-29T21:35:47.670078Z] Loop 494: Loss: 1.76e-02, Avg Return: 0.315, Regret: 0.4926, Entropy: 0.6960 +[2026-01-29T21:35:48.833555Z] Loop 495: Loss: 1.53e-02, Avg Return: 0.304, Regret: 0.4926, Entropy: 0.6962 +[2026-01-29T21:35:50.034659Z] Loop 496: Loss: 1.66e-02, Avg Return: 0.316, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:35:51.195254Z] Loop 497: Loss: 1.69e-02, Avg Return: 0.305, Regret: 0.4925, Entropy: 0.6962 +[2026-01-29T21:35:52.396124Z] Loop 498: Loss: 1.60e-02, Avg Return: 0.309, Regret: 0.4926, Entropy: 0.6957 +[2026-01-29T21:35:53.556212Z] Loop 499: Loss: 1.72e-02, Avg Return: 0.308, Regret: 0.4926, Entropy: 0.6946 +[2026-01-29T21:35:54.758599Z] Loop 500: Loss: 1.72e-02, Avg Return: 0.311, Regret: 0.4933, Entropy: 0.6935 +[2026-01-29T21:35:55.918058Z] Loop 501: Loss: 1.71e-02, Avg Return: 0.308, Regret: 0.4933, Entropy: 0.6922 +[2026-01-29T21:35:57.078395Z] Loop 502: Loss: 1.66e-02, Avg Return: 0.313, Regret: 0.4933, Entropy: 0.6915 +[2026-01-29T21:35:58.237323Z] Loop 503: Loss: 1.73e-02, Avg Return: 0.307, Regret: 0.4933, Entropy: 0.6917 +[2026-01-29T21:35:59.396994Z] Loop 504: Loss: 1.72e-02, Avg Return: 0.311, Regret: 0.4933, Entropy: 0.6928 +[2026-01-29T21:36:00.607567Z] Loop 505: Loss: 1.70e-02, Avg Return: 0.315, Regret: 0.4931, Entropy: 0.6945 +[2026-01-29T21:36:01.771190Z] Loop 506: Loss: 1.57e-02, Avg Return: 0.310, Regret: 0.4931, Entropy: 0.6961 +[2026-01-29T21:36:02.932003Z] Loop 507: Loss: 1.63e-02, Avg Return: 0.313, Regret: 0.4931, Entropy: 0.6967 +[2026-01-29T21:36:04.091527Z] Loop 508: Loss: 1.73e-02, Avg Return: 0.306, Regret: 0.4931, Entropy: 0.6964 +[2026-01-29T21:36:05.250675Z] Loop 509: Loss: 1.62e-02, Avg Return: 0.311, Regret: 0.4931, Entropy: 0.6955 +[2026-01-29T21:36:06.450964Z] Loop 510: Loss: 1.73e-02, Avg Return: 0.316, Regret: 0.4932, Entropy: 0.6946 +[2026-01-29T21:36:07.610144Z] Loop 511: Loss: 1.57e-02, Avg Return: 0.307, Regret: 0.4932, Entropy: 0.6944 +[2026-01-29T21:36:08.773454Z] Loop 512: Loss: 1.69e-02, Avg Return: 0.307, Regret: 0.4932, Entropy: 0.6948 +[2026-01-29T21:36:09.933807Z] Loop 513: Loss: 1.72e-02, Avg Return: 0.310, Regret: 0.4932, Entropy: 0.6954 +[2026-01-29T21:36:11.093382Z] Loop 514: Loss: 1.67e-02, Avg Return: 0.314, Regret: 0.4932, Entropy: 0.6962 +[2026-01-29T21:36:12.297615Z] Loop 515: Loss: 1.64e-02, Avg Return: 0.314, Regret: 0.4926, Entropy: 0.6969 +[2026-01-29T21:36:13.458055Z] Loop 516: Loss: 1.70e-02, Avg Return: 0.306, Regret: 0.4926, Entropy: 0.6971 +[2026-01-29T21:36:14.621106Z] Loop 517: Loss: 1.60e-02, Avg Return: 0.307, Regret: 0.4926, Entropy: 0.6966 +[2026-01-29T21:36:15.783197Z] Loop 518: Loss: 1.62e-02, Avg Return: 0.309, Regret: 0.4926, Entropy: 0.6959 +[2026-01-29T21:36:16.943040Z] Loop 519: Loss: 1.63e-02, Avg Return: 0.303, Regret: 0.4926, Entropy: 0.6951 +[2026-01-29T21:36:18.142676Z] Loop 520: Loss: 1.64e-02, Avg Return: 0.308, Regret: 0.4933, Entropy: 0.6943 +[2026-01-29T21:36:19.301780Z] Loop 521: Loss: 1.62e-02, Avg Return: 0.310, Regret: 0.4933, Entropy: 0.6935 +[2026-01-29T21:36:20.461664Z] Loop 522: Loss: 1.65e-02, Avg Return: 0.312, Regret: 0.4933, Entropy: 0.6936 +[2026-01-29T21:36:21.624096Z] Loop 523: Loss: 1.69e-02, Avg Return: 0.310, Regret: 0.4933, Entropy: 0.6940 +[2026-01-29T21:36:22.785477Z] Loop 524: Loss: 1.72e-02, Avg Return: 0.312, Regret: 0.4933, Entropy: 0.6947 +[2026-01-29T21:36:23.994683Z] Loop 525: Loss: 1.63e-02, Avg Return: 0.305, Regret: 0.4928, Entropy: 0.6958 +[2026-01-29T21:36:25.153688Z] Loop 526: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4928, Entropy: 0.6966 +[2026-01-29T21:36:26.312024Z] Loop 527: Loss: 1.68e-02, Avg Return: 0.316, Regret: 0.4928, Entropy: 0.6969 +[2026-01-29T21:36:27.470543Z] Loop 528: Loss: 1.60e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.6968 +[2026-01-29T21:36:28.628296Z] Loop 529: Loss: 1.68e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.6962 +[2026-01-29T21:36:29.826731Z] Loop 530: Loss: 1.58e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.6956 +[2026-01-29T21:36:30.985521Z] Loop 531: Loss: 1.63e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.6953 +[2026-01-29T21:36:32.144891Z] Loop 532: Loss: 1.64e-02, Avg Return: 0.310, Regret: 0.4929, Entropy: 0.6948 +[2026-01-29T21:36:33.305583Z] Loop 533: Loss: 1.69e-02, Avg Return: 0.307, Regret: 0.4929, Entropy: 0.6946 +[2026-01-29T21:36:34.464219Z] Loop 534: Loss: 1.61e-02, Avg Return: 0.309, Regret: 0.4929, Entropy: 0.6948 +[2026-01-29T21:36:35.663120Z] Loop 535: Loss: 1.79e-02, Avg Return: 0.306, Regret: 0.4930, Entropy: 0.6949 +[2026-01-29T21:36:36.827842Z] Loop 536: Loss: 1.73e-02, Avg Return: 0.312, Regret: 0.4930, Entropy: 0.6955 +[2026-01-29T21:36:37.987039Z] Loop 537: Loss: 1.66e-02, Avg Return: 0.309, Regret: 0.4930, Entropy: 0.6959 +[2026-01-29T21:36:39.146528Z] Loop 538: Loss: 1.70e-02, Avg Return: 0.308, Regret: 0.4930, Entropy: 0.6960 +[2026-01-29T21:36:40.305502Z] Loop 539: Loss: 1.74e-02, Avg Return: 0.316, Regret: 0.4930, Entropy: 0.6962 +[2026-01-29T21:36:41.513617Z] Loop 540: Loss: 1.75e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:36:42.690462Z] Loop 541: Loss: 1.61e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:36:43.849771Z] Loop 542: Loss: 1.71e-02, Avg Return: 0.320, Regret: 0.4925, Entropy: 0.6963 +[2026-01-29T21:36:45.012274Z] Loop 543: Loss: 1.77e-02, Avg Return: 0.316, Regret: 0.4925, Entropy: 0.6960 +[2026-01-29T21:36:46.174931Z] Loop 544: Loss: 1.58e-02, Avg Return: 0.311, Regret: 0.4925, Entropy: 0.6955 +[2026-01-29T21:36:47.380795Z] Loop 545: Loss: 1.69e-02, Avg Return: 0.308, Regret: 0.4927, Entropy: 0.6954 +[2026-01-29T21:36:48.542015Z] Loop 546: Loss: 1.66e-02, Avg Return: 0.309, Regret: 0.4927, Entropy: 0.6956 +[2026-01-29T21:36:49.701832Z] Loop 547: Loss: 1.66e-02, Avg Return: 0.310, Regret: 0.4927, Entropy: 0.6958 +[2026-01-29T21:36:50.863839Z] Loop 548: Loss: 1.71e-02, Avg Return: 0.305, Regret: 0.4927, Entropy: 0.6961 +[2026-01-29T21:36:52.032393Z] Loop 549: Loss: 1.69e-02, Avg Return: 0.313, Regret: 0.4927, Entropy: 0.6963 +[2026-01-29T21:36:53.238253Z] Loop 550: Loss: 1.66e-02, Avg Return: 0.305, Regret: 0.4925, Entropy: 0.6961 +[2026-01-29T21:36:54.398920Z] Loop 551: Loss: 1.66e-02, Avg Return: 0.308, Regret: 0.4925, Entropy: 0.6956 +[2026-01-29T21:36:55.559728Z] Loop 552: Loss: 1.67e-02, Avg Return: 0.315, Regret: 0.4925, Entropy: 0.6947 +[2026-01-29T21:36:56.720538Z] Loop 553: Loss: 1.67e-02, Avg Return: 0.316, Regret: 0.4925, Entropy: 0.6940 +[2026-01-29T21:36:57.884679Z] Loop 554: Loss: 1.69e-02, Avg Return: 0.314, Regret: 0.4925, Entropy: 0.6936 +[2026-01-29T21:36:59.103868Z] Loop 555: Loss: 1.71e-02, Avg Return: 0.310, Regret: 0.4933, Entropy: 0.6936 +[2026-01-29T21:37:00.266270Z] Loop 556: Loss: 1.68e-02, Avg Return: 0.314, Regret: 0.4933, Entropy: 0.6943 +[2026-01-29T21:37:01.426905Z] Loop 557: Loss: 1.61e-02, Avg Return: 0.317, Regret: 0.4933, Entropy: 0.6949 +[2026-01-29T21:37:02.585283Z] Loop 558: Loss: 1.65e-02, Avg Return: 0.302, Regret: 0.4933, Entropy: 0.6954 +[2026-01-29T21:37:03.743608Z] Loop 559: Loss: 1.68e-02, Avg Return: 0.309, Regret: 0.4933, Entropy: 0.6959 +[2026-01-29T21:37:04.956315Z] Loop 560: Loss: 1.81e-02, Avg Return: 0.319, Regret: 0.4926, Entropy: 0.6961 +[2026-01-29T21:37:06.123438Z] Loop 561: Loss: 1.65e-02, Avg Return: 0.305, Regret: 0.4926, Entropy: 0.6966 +[2026-01-29T21:37:07.283084Z] Loop 562: Loss: 1.60e-02, Avg Return: 0.319, Regret: 0.4926, Entropy: 0.6967 +[2026-01-29T21:37:08.442098Z] Loop 563: Loss: 1.66e-02, Avg Return: 0.307, Regret: 0.4926, Entropy: 0.6968 +[2026-01-29T21:37:09.601868Z] Loop 564: Loss: 1.78e-02, Avg Return: 0.313, Regret: 0.4926, Entropy: 0.6969 +[2026-01-29T21:37:10.804025Z] Loop 565: Loss: 1.70e-02, Avg Return: 0.314, Regret: 0.4925, Entropy: 0.6970 +[2026-01-29T21:37:11.967863Z] Loop 566: Loss: 1.56e-02, Avg Return: 0.304, Regret: 0.4925, Entropy: 0.6971 +[2026-01-29T21:37:13.134003Z] Loop 567: Loss: 1.62e-02, Avg Return: 0.315, Regret: 0.4925, Entropy: 0.6971 +[2026-01-29T21:37:14.298142Z] Loop 568: Loss: 1.74e-02, Avg Return: 0.316, Regret: 0.4925, Entropy: 0.6971 +[2026-01-29T21:37:15.458273Z] Loop 569: Loss: 1.63e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6971 +[2026-01-29T21:37:16.660875Z] Loop 570: Loss: 1.63e-02, Avg Return: 0.310, Regret: 0.4925, Entropy: 0.6971 +[2026-01-29T21:37:17.824091Z] Loop 571: Loss: 1.54e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6972 +[2026-01-29T21:37:18.987632Z] Loop 572: Loss: 1.63e-02, Avg Return: 0.306, Regret: 0.4925, Entropy: 0.6974 +[2026-01-29T21:37:20.150564Z] Loop 573: Loss: 1.62e-02, Avg Return: 0.313, Regret: 0.4925, Entropy: 0.6975 +[2026-01-29T21:37:21.310815Z] Loop 574: Loss: 1.79e-02, Avg Return: 0.304, Regret: 0.4925, Entropy: 0.6976 +[2026-01-29T21:37:22.515924Z] Loop 575: Loss: 1.57e-02, Avg Return: 0.318, Regret: 0.4925, Entropy: 0.6976 +[2026-01-29T21:37:23.675894Z] Loop 576: Loss: 1.61e-02, Avg Return: 0.312, Regret: 0.4925, Entropy: 0.6976 +[2026-01-29T21:37:24.836272Z] Loop 577: Loss: 1.60e-02, Avg Return: 0.310, Regret: 0.4925, Entropy: 0.6976 +[2026-01-29T21:37:25.995379Z] Loop 578: Loss: 1.66e-02, Avg Return: 0.307, Regret: 0.4925, Entropy: 0.6975 +[2026-01-29T21:37:27.155573Z] Loop 579: Loss: 1.71e-02, Avg Return: 0.310, Regret: 0.4925, Entropy: 0.6974 +[2026-01-29T21:37:28.355492Z] Loop 580: Loss: 1.74e-02, Avg Return: 0.312, Regret: 0.4925, Entropy: 0.6974 +[2026-01-29T21:37:29.517345Z] Loop 581: Loss: 1.66e-02, Avg Return: 0.305, Regret: 0.4925, Entropy: 0.6974 +[2026-01-29T21:37:30.681803Z] Loop 582: Loss: 1.70e-02, Avg Return: 0.314, Regret: 0.4925, Entropy: 0.6973 +[2026-01-29T21:37:31.842951Z] Loop 583: Loss: 1.69e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6973 +[2026-01-29T21:37:33.003003Z] Loop 584: Loss: 1.62e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6972 +[2026-01-29T21:37:34.207713Z] Loop 585: Loss: 1.70e-02, Avg Return: 0.308, Regret: 0.4925, Entropy: 0.6971 +[2026-01-29T21:37:35.368681Z] Loop 586: Loss: 1.66e-02, Avg Return: 0.312, Regret: 0.4925, Entropy: 0.6969 +[2026-01-29T21:37:36.528780Z] Loop 587: Loss: 1.69e-02, Avg Return: 0.308, Regret: 0.4925, Entropy: 0.6967 +[2026-01-29T21:37:37.687303Z] Loop 588: Loss: 1.75e-02, Avg Return: 0.310, Regret: 0.4925, Entropy: 0.6961 +[2026-01-29T21:37:38.846477Z] Loop 589: Loss: 1.72e-02, Avg Return: 0.318, Regret: 0.4925, Entropy: 0.6955 +[2026-01-29T21:37:40.046858Z] Loop 590: Loss: 1.62e-02, Avg Return: 0.313, Regret: 0.4929, Entropy: 0.6950 +[2026-01-29T21:37:41.206554Z] Loop 591: Loss: 1.65e-02, Avg Return: 0.305, Regret: 0.4929, Entropy: 0.6951 +[2026-01-29T21:37:42.365898Z] Loop 592: Loss: 1.56e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.6952 +[2026-01-29T21:37:43.526208Z] Loop 593: Loss: 1.65e-02, Avg Return: 0.315, Regret: 0.4929, Entropy: 0.6949 +[2026-01-29T21:37:44.685186Z] Loop 594: Loss: 1.77e-02, Avg Return: 0.316, Regret: 0.4929, Entropy: 0.6950 +[2026-01-29T21:37:45.886565Z] Loop 595: Loss: 1.75e-02, Avg Return: 0.312, Regret: 0.4929, Entropy: 0.6949 +[2026-01-29T21:37:47.045872Z] Loop 596: Loss: 1.69e-02, Avg Return: 0.312, Regret: 0.4929, Entropy: 0.6948 +[2026-01-29T21:37:48.208305Z] Loop 597: Loss: 1.53e-02, Avg Return: 0.307, Regret: 0.4929, Entropy: 0.6954 +[2026-01-29T21:37:49.368561Z] Loop 598: Loss: 1.83e-02, Avg Return: 0.322, Regret: 0.4929, Entropy: 0.6959 +[2026-01-29T21:37:50.529251Z] Loop 599: Loss: 1.61e-02, Avg Return: 0.307, Regret: 0.4929, Entropy: 0.6963 +[2026-01-29T21:37:51.732331Z] Loop 600: Loss: 1.50e-02, Avg Return: 0.307, Regret: 0.4924, Entropy: 0.6964 +[2026-01-29T21:37:52.893696Z] Loop 601: Loss: 1.61e-02, Avg Return: 0.306, Regret: 0.4924, Entropy: 0.6964 +[2026-01-29T21:37:54.054034Z] Loop 602: Loss: 1.61e-02, Avg Return: 0.309, Regret: 0.4924, Entropy: 0.6963 +[2026-01-29T21:37:55.214847Z] Loop 603: Loss: 1.71e-02, Avg Return: 0.316, Regret: 0.4924, Entropy: 0.6960 +[2026-01-29T21:37:56.374541Z] Loop 604: Loss: 1.73e-02, Avg Return: 0.315, Regret: 0.4924, Entropy: 0.6956 +[2026-01-29T21:37:57.575844Z] Loop 605: Loss: 1.72e-02, Avg Return: 0.312, Regret: 0.4926, Entropy: 0.6956 +[2026-01-29T21:37:58.734971Z] Loop 606: Loss: 1.60e-02, Avg Return: 0.310, Regret: 0.4926, Entropy: 0.6956 +[2026-01-29T21:37:59.895281Z] Loop 607: Loss: 1.61e-02, Avg Return: 0.312, Regret: 0.4926, Entropy: 0.6959 +[2026-01-29T21:38:01.054477Z] Loop 608: Loss: 1.66e-02, Avg Return: 0.310, Regret: 0.4926, Entropy: 0.6962 +[2026-01-29T21:38:02.214536Z] Loop 609: Loss: 1.77e-02, Avg Return: 0.317, Regret: 0.4926, Entropy: 0.6963 +[2026-01-29T21:38:03.413689Z] Loop 610: Loss: 1.74e-02, Avg Return: 0.313, Regret: 0.4924, Entropy: 0.6961 +[2026-01-29T21:38:04.577743Z] Loop 611: Loss: 1.77e-02, Avg Return: 0.313, Regret: 0.4924, Entropy: 0.6956 +[2026-01-29T21:38:05.736973Z] Loop 612: Loss: 1.66e-02, Avg Return: 0.306, Regret: 0.4924, Entropy: 0.6951 +[2026-01-29T21:38:06.897962Z] Loop 613: Loss: 1.71e-02, Avg Return: 0.310, Regret: 0.4924, Entropy: 0.6952 +[2026-01-29T21:38:08.058769Z] Loop 614: Loss: 1.54e-02, Avg Return: 0.311, Regret: 0.4924, Entropy: 0.6958 +[2026-01-29T21:38:09.261688Z] Loop 615: Loss: 1.62e-02, Avg Return: 0.302, Regret: 0.4924, Entropy: 0.6964 +[2026-01-29T21:38:10.422529Z] Loop 616: Loss: 1.64e-02, Avg Return: 0.309, Regret: 0.4924, Entropy: 0.6966 +[2026-01-29T21:38:11.585466Z] Loop 617: Loss: 1.67e-02, Avg Return: 0.303, Regret: 0.4924, Entropy: 0.6966 +[2026-01-29T21:38:12.744520Z] Loop 618: Loss: 1.71e-02, Avg Return: 0.309, Regret: 0.4924, Entropy: 0.6964 +[2026-01-29T21:38:13.904856Z] Loop 619: Loss: 1.64e-02, Avg Return: 0.310, Regret: 0.4924, Entropy: 0.6962 +[2026-01-29T21:38:15.107100Z] Loop 620: Loss: 1.87e-02, Avg Return: 0.318, Regret: 0.4925, Entropy: 0.6961 +[2026-01-29T21:38:16.268225Z] Loop 621: Loss: 1.65e-02, Avg Return: 0.310, Regret: 0.4925, Entropy: 0.6962 +[2026-01-29T21:38:17.427913Z] Loop 622: Loss: 1.59e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:38:18.587406Z] Loop 623: Loss: 1.65e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6965 +[2026-01-29T21:38:19.746005Z] Loop 624: Loss: 1.64e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6964 +[2026-01-29T21:38:20.947153Z] Loop 625: Loss: 1.59e-02, Avg Return: 0.316, Regret: 0.4925, Entropy: 0.6959 +[2026-01-29T21:38:22.107655Z] Loop 626: Loss: 1.67e-02, Avg Return: 0.309, Regret: 0.4925, Entropy: 0.6954 +[2026-01-29T21:38:23.268236Z] Loop 627: Loss: 1.73e-02, Avg Return: 0.311, Regret: 0.4925, Entropy: 0.6950 +[2026-01-29T21:38:24.427863Z] Loop 628: Loss: 1.67e-02, Avg Return: 0.313, Regret: 0.4925, Entropy: 0.6952 +[2026-01-29T21:38:25.588002Z] Loop 629: Loss: 1.66e-02, Avg Return: 0.307, Regret: 0.4925, Entropy: 0.6955 +[2026-01-29T21:38:26.789083Z] Loop 630: Loss: 1.63e-02, Avg Return: 0.307, Regret: 0.4924, Entropy: 0.6960 +[2026-01-29T21:38:27.951000Z] Loop 631: Loss: 1.66e-02, Avg Return: 0.312, Regret: 0.4924, Entropy: 0.6963 +[2026-01-29T21:38:29.111888Z] Loop 632: Loss: 1.76e-02, Avg Return: 0.320, Regret: 0.4924, Entropy: 0.6962 +[2026-01-29T21:38:30.272522Z] Loop 633: Loss: 1.48e-02, Avg Return: 0.307, Regret: 0.4924, Entropy: 0.6958 +[2026-01-29T21:38:31.432782Z] Loop 634: Loss: 1.64e-02, Avg Return: 0.316, Regret: 0.4924, Entropy: 0.6955 +[2026-01-29T21:38:32.642897Z] Loop 635: Loss: 1.67e-02, Avg Return: 0.322, Regret: 0.4926, Entropy: 0.6952 +[2026-01-29T21:38:33.802763Z] Loop 636: Loss: 1.59e-02, Avg Return: 0.308, Regret: 0.4926, Entropy: 0.6950 +[2026-01-29T21:38:34.963516Z] Loop 637: Loss: 1.62e-02, Avg Return: 0.308, Regret: 0.4926, Entropy: 0.6950 +[2026-01-29T21:38:36.123021Z] Loop 638: Loss: 1.60e-02, Avg Return: 0.305, Regret: 0.4926, Entropy: 0.6951 +[2026-01-29T21:38:37.282676Z] Loop 639: Loss: 1.65e-02, Avg Return: 0.315, Regret: 0.4926, Entropy: 0.6954 +[2026-01-29T21:38:38.485180Z] Loop 640: Loss: 1.56e-02, Avg Return: 0.307, Regret: 0.4924, Entropy: 0.6957 +[2026-01-29T21:38:39.646091Z] Loop 641: Loss: 1.80e-02, Avg Return: 0.310, Regret: 0.4924, Entropy: 0.6957 +[2026-01-29T21:38:40.806315Z] Loop 642: Loss: 1.64e-02, Avg Return: 0.315, Regret: 0.4924, Entropy: 0.6958 +[2026-01-29T21:38:41.967517Z] Loop 643: Loss: 1.72e-02, Avg Return: 0.312, Regret: 0.4924, Entropy: 0.6956 +[2026-01-29T21:38:43.130409Z] Loop 644: Loss: 1.62e-02, Avg Return: 0.311, Regret: 0.4924, Entropy: 0.6950 +[2026-01-29T21:38:44.332970Z] Loop 645: Loss: 1.72e-02, Avg Return: 0.318, Regret: 0.4929, Entropy: 0.6936 +[2026-01-29T21:38:45.492473Z] Loop 646: Loss: 1.77e-02, Avg Return: 0.307, Regret: 0.4929, Entropy: 0.6923 +[2026-01-29T21:38:46.651784Z] Loop 647: Loss: 1.55e-02, Avg Return: 0.307, Regret: 0.4929, Entropy: 0.6922 +[2026-01-29T21:38:47.812141Z] Loop 648: Loss: 1.61e-02, Avg Return: 0.306, Regret: 0.4929, Entropy: 0.6926 +[2026-01-29T21:38:48.973135Z] Loop 649: Loss: 1.67e-02, Avg Return: 0.310, Regret: 0.4929, Entropy: 0.6930 +[2026-01-29T21:38:50.178196Z] Loop 650: Loss: 1.60e-02, Avg Return: 0.309, Regret: 0.4928, Entropy: 0.6937 +[2026-01-29T21:38:51.337101Z] Loop 651: Loss: 1.58e-02, Avg Return: 0.305, Regret: 0.4928, Entropy: 0.6946 +[2026-01-29T21:38:52.496625Z] Loop 652: Loss: 1.77e-02, Avg Return: 0.323, Regret: 0.4928, Entropy: 0.6950 +[2026-01-29T21:38:53.657433Z] Loop 653: Loss: 1.46e-02, Avg Return: 0.310, Regret: 0.4928, Entropy: 0.6953 +[2026-01-29T21:38:54.818408Z] Loop 654: Loss: 1.69e-02, Avg Return: 0.308, Regret: 0.4928, Entropy: 0.6954 +[2026-01-29T21:38:56.019888Z] Loop 655: Loss: 1.66e-02, Avg Return: 0.311, Regret: 0.4923, Entropy: 0.6955 +[2026-01-29T21:38:57.180150Z] Loop 656: Loss: 1.55e-02, Avg Return: 0.311, Regret: 0.4923, Entropy: 0.6954 +[2026-01-29T21:38:58.339480Z] Loop 657: Loss: 1.62e-02, Avg Return: 0.312, Regret: 0.4923, Entropy: 0.6954 +[2026-01-29T21:38:59.500752Z] Loop 658: Loss: 1.67e-02, Avg Return: 0.316, Regret: 0.4923, Entropy: 0.6952 +[2026-01-29T21:39:00.660665Z] Loop 659: Loss: 1.70e-02, Avg Return: 0.317, Regret: 0.4923, Entropy: 0.6950 +[2026-01-29T21:39:01.862383Z] Loop 660: Loss: 1.58e-02, Avg Return: 0.308, Regret: 0.4924, Entropy: 0.6949 +[2026-01-29T21:39:03.021527Z] Loop 661: Loss: 1.62e-02, Avg Return: 0.308, Regret: 0.4924, Entropy: 0.6949 +[2026-01-29T21:39:04.179953Z] Loop 662: Loss: 1.74e-02, Avg Return: 0.312, Regret: 0.4924, Entropy: 0.6948 +[2026-01-29T21:39:05.340935Z] Loop 663: Loss: 1.56e-02, Avg Return: 0.307, Regret: 0.4924, Entropy: 0.6949 +[2026-01-29T21:39:06.509735Z] Loop 664: Loss: 1.68e-02, Avg Return: 0.311, Regret: 0.4924, Entropy: 0.6950 +[2026-01-29T21:39:07.729083Z] Loop 665: Loss: 1.60e-02, Avg Return: 0.307, Regret: 0.4923, Entropy: 0.6950 +[2026-01-29T21:39:08.890742Z] Loop 666: Loss: 1.60e-02, Avg Return: 0.310, Regret: 0.4923, Entropy: 0.6950 +[2026-01-29T21:39:10.050093Z] Loop 667: Loss: 1.62e-02, Avg Return: 0.312, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:11.209799Z] Loop 668: Loss: 1.60e-02, Avg Return: 0.313, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:12.368878Z] Loop 669: Loss: 1.82e-02, Avg Return: 0.320, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:13.577375Z] Loop 670: Loss: 1.66e-02, Avg Return: 0.310, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:14.744926Z] Loop 671: Loss: 1.61e-02, Avg Return: 0.304, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:15.911774Z] Loop 672: Loss: 1.55e-02, Avg Return: 0.311, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:17.074298Z] Loop 673: Loss: 1.65e-02, Avg Return: 0.311, Regret: 0.4923, Entropy: 0.6947 +[2026-01-29T21:39:18.234674Z] Loop 674: Loss: 1.58e-02, Avg Return: 0.314, Regret: 0.4923, Entropy: 0.6946 +[2026-01-29T21:39:19.441019Z] Loop 675: Loss: 1.59e-02, Avg Return: 0.309, Regret: 0.4923, Entropy: 0.6947 +[2026-01-29T21:39:20.600970Z] Loop 676: Loss: 1.64e-02, Avg Return: 0.308, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:21.760572Z] Loop 677: Loss: 1.66e-02, Avg Return: 0.312, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:22.919598Z] Loop 678: Loss: 1.64e-02, Avg Return: 0.316, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:24.081898Z] Loop 679: Loss: 1.75e-02, Avg Return: 0.307, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:25.294638Z] Loop 680: Loss: 1.71e-02, Avg Return: 0.315, Regret: 0.4922, Entropy: 0.6949 +[2026-01-29T21:39:26.455958Z] Loop 681: Loss: 1.66e-02, Avg Return: 0.311, Regret: 0.4922, Entropy: 0.6949 +[2026-01-29T21:39:27.615643Z] Loop 682: Loss: 1.60e-02, Avg Return: 0.316, Regret: 0.4922, Entropy: 0.6949 +[2026-01-29T21:39:28.775900Z] Loop 683: Loss: 1.80e-02, Avg Return: 0.319, Regret: 0.4922, Entropy: 0.6948 +[2026-01-29T21:39:29.934788Z] Loop 684: Loss: 1.66e-02, Avg Return: 0.308, Regret: 0.4922, Entropy: 0.6946 +[2026-01-29T21:39:31.135966Z] Loop 685: Loss: 1.62e-02, Avg Return: 0.308, Regret: 0.4923, Entropy: 0.6945 +[2026-01-29T21:39:32.294768Z] Loop 686: Loss: 1.64e-02, Avg Return: 0.311, Regret: 0.4923, Entropy: 0.6946 +[2026-01-29T21:39:33.454418Z] Loop 687: Loss: 1.71e-02, Avg Return: 0.309, Regret: 0.4923, Entropy: 0.6946 +[2026-01-29T21:39:34.614216Z] Loop 688: Loss: 1.66e-02, Avg Return: 0.315, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:35.773568Z] Loop 689: Loss: 1.65e-02, Avg Return: 0.307, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:39:36.984048Z] Loop 690: Loss: 1.66e-02, Avg Return: 0.312, Regret: 0.4922, Entropy: 0.6949 +[2026-01-29T21:39:38.146171Z] Loop 691: Loss: 1.76e-02, Avg Return: 0.312, Regret: 0.4922, Entropy: 0.6948 +[2026-01-29T21:39:39.307658Z] Loop 692: Loss: 1.68e-02, Avg Return: 0.315, Regret: 0.4922, Entropy: 0.6948 +[2026-01-29T21:39:40.469014Z] Loop 693: Loss: 1.66e-02, Avg Return: 0.310, Regret: 0.4922, Entropy: 0.6948 +[2026-01-29T21:39:41.629696Z] Loop 694: Loss: 1.77e-02, Avg Return: 0.309, Regret: 0.4922, Entropy: 0.6948 +[2026-01-29T21:39:42.831396Z] Loop 695: Loss: 1.68e-02, Avg Return: 0.312, Regret: 0.4922, Entropy: 0.6948 +[2026-01-29T21:39:43.990915Z] Loop 696: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4922, Entropy: 0.6947 +[2026-01-29T21:39:45.150550Z] Loop 697: Loss: 1.68e-02, Avg Return: 0.309, Regret: 0.4922, Entropy: 0.6944 +[2026-01-29T21:39:46.310408Z] Loop 698: Loss: 1.67e-02, Avg Return: 0.306, Regret: 0.4922, Entropy: 0.6937 +[2026-01-29T21:39:47.470696Z] Loop 699: Loss: 1.68e-02, Avg Return: 0.307, Regret: 0.4922, Entropy: 0.6927 +[2026-01-29T21:39:48.674423Z] Loop 700: Loss: 1.71e-02, Avg Return: 0.315, Regret: 0.4929, Entropy: 0.6921 +[2026-01-29T21:39:49.836016Z] Loop 701: Loss: 1.66e-02, Avg Return: 0.314, Regret: 0.4929, Entropy: 0.6924 +[2026-01-29T21:39:50.995618Z] Loop 702: Loss: 1.69e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.6932 +[2026-01-29T21:39:52.158873Z] Loop 703: Loss: 1.69e-02, Avg Return: 0.311, Regret: 0.4929, Entropy: 0.6938 +[2026-01-29T21:39:53.319194Z] Loop 704: Loss: 1.63e-02, Avg Return: 0.308, Regret: 0.4929, Entropy: 0.6944 +[2026-01-29T21:39:54.526793Z] Loop 705: Loss: 1.58e-02, Avg Return: 0.309, Regret: 0.4921, Entropy: 0.6947 +[2026-01-29T21:39:55.688856Z] Loop 706: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4921, Entropy: 0.6947 +[2026-01-29T21:39:56.848974Z] Loop 707: Loss: 1.63e-02, Avg Return: 0.314, Regret: 0.4921, Entropy: 0.6944 +[2026-01-29T21:39:58.010192Z] Loop 708: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4921, Entropy: 0.6941 +[2026-01-29T21:39:59.170460Z] Loop 709: Loss: 1.53e-02, Avg Return: 0.307, Regret: 0.4921, Entropy: 0.6936 +[2026-01-29T21:40:00.371992Z] Loop 710: Loss: 1.69e-02, Avg Return: 0.316, Regret: 0.4926, Entropy: 0.6932 +[2026-01-29T21:40:01.532651Z] Loop 711: Loss: 1.60e-02, Avg Return: 0.313, Regret: 0.4926, Entropy: 0.6936 +[2026-01-29T21:40:02.692568Z] Loop 712: Loss: 1.66e-02, Avg Return: 0.309, Regret: 0.4926, Entropy: 0.6939 +[2026-01-29T21:40:03.852575Z] Loop 713: Loss: 1.65e-02, Avg Return: 0.310, Regret: 0.4926, Entropy: 0.6943 +[2026-01-29T21:40:05.012420Z] Loop 714: Loss: 1.64e-02, Avg Return: 0.309, Regret: 0.4926, Entropy: 0.6946 +[2026-01-29T21:40:06.214091Z] Loop 715: Loss: 1.57e-02, Avg Return: 0.310, Regret: 0.4921, Entropy: 0.6944 +[2026-01-29T21:40:07.375014Z] Loop 716: Loss: 1.78e-02, Avg Return: 0.313, Regret: 0.4921, Entropy: 0.6930 +[2026-01-29T21:40:08.534124Z] Loop 717: Loss: 1.71e-02, Avg Return: 0.312, Regret: 0.4921, Entropy: 0.6917 +[2026-01-29T21:40:09.693943Z] Loop 718: Loss: 1.55e-02, Avg Return: 0.308, Regret: 0.4921, Entropy: 0.6923 +[2026-01-29T21:40:10.852598Z] Loop 719: Loss: 1.57e-02, Avg Return: 0.309, Regret: 0.4921, Entropy: 0.6931 +[2026-01-29T21:40:12.054322Z] Loop 720: Loss: 1.74e-02, Avg Return: 0.315, Regret: 0.4923, Entropy: 0.6939 +[2026-01-29T21:40:13.214030Z] Loop 721: Loss: 1.67e-02, Avg Return: 0.312, Regret: 0.4923, Entropy: 0.6945 +[2026-01-29T21:40:14.375111Z] Loop 722: Loss: 1.67e-02, Avg Return: 0.313, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:40:15.533798Z] Loop 723: Loss: 1.52e-02, Avg Return: 0.311, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:40:16.693931Z] Loop 724: Loss: 1.66e-02, Avg Return: 0.309, Regret: 0.4923, Entropy: 0.6949 +[2026-01-29T21:40:17.899021Z] Loop 725: Loss: 1.63e-02, Avg Return: 0.315, Regret: 0.4921, Entropy: 0.6949 +[2026-01-29T21:40:19.059801Z] Loop 726: Loss: 1.61e-02, Avg Return: 0.312, Regret: 0.4921, Entropy: 0.6950 +[2026-01-29T21:40:20.218825Z] Loop 727: Loss: 1.70e-02, Avg Return: 0.315, Regret: 0.4921, Entropy: 0.6950 +[2026-01-29T21:40:21.381055Z] Loop 728: Loss: 1.70e-02, Avg Return: 0.313, Regret: 0.4921, Entropy: 0.6947 +[2026-01-29T21:40:22.541951Z] Loop 729: Loss: 1.71e-02, Avg Return: 0.318, Regret: 0.4921, Entropy: 0.6946 +[2026-01-29T21:40:23.746629Z] Loop 730: Loss: 1.73e-02, Avg Return: 0.308, Regret: 0.4922, Entropy: 0.6944 +[2026-01-29T21:40:24.907264Z] Loop 731: Loss: 1.76e-02, Avg Return: 0.316, Regret: 0.4922, Entropy: 0.6940 +[2026-01-29T21:40:26.066683Z] Loop 732: Loss: 1.67e-02, Avg Return: 0.310, Regret: 0.4922, Entropy: 0.6935 +[2026-01-29T21:40:27.231654Z] Loop 733: Loss: 1.59e-02, Avg Return: 0.313, Regret: 0.4922, Entropy: 0.6934 +[2026-01-29T21:40:28.392573Z] Loop 734: Loss: 1.68e-02, Avg Return: 0.312, Regret: 0.4922, Entropy: 0.6939 +[2026-01-29T21:40:29.597848Z] Loop 735: Loss: 1.74e-02, Avg Return: 0.313, Regret: 0.4921, Entropy: 0.6944 +[2026-01-29T21:40:30.758396Z] Loop 736: Loss: 1.69e-02, Avg Return: 0.309, Regret: 0.4921, Entropy: 0.6947 +[2026-01-29T21:40:31.917647Z] Loop 737: Loss: 1.67e-02, Avg Return: 0.316, Regret: 0.4921, Entropy: 0.6948 +[2026-01-29T21:40:33.077550Z] Loop 738: Loss: 1.66e-02, Avg Return: 0.310, Regret: 0.4921, Entropy: 0.6947 +[2026-01-29T21:40:34.236840Z] Loop 739: Loss: 1.68e-02, Avg Return: 0.314, Regret: 0.4921, Entropy: 0.6947 +[2026-01-29T21:40:35.438902Z] Loop 740: Loss: 1.66e-02, Avg Return: 0.306, Regret: 0.4920, Entropy: 0.6947 +[2026-01-29T21:40:36.598441Z] Loop 741: Loss: 1.66e-02, Avg Return: 0.316, Regret: 0.4920, Entropy: 0.6948 +[2026-01-29T21:40:37.759075Z] Loop 742: Loss: 1.76e-02, Avg Return: 0.310, Regret: 0.4920, Entropy: 0.6948 +[2026-01-29T21:40:38.918392Z] Loop 743: Loss: 1.59e-02, Avg Return: 0.311, Regret: 0.4920, Entropy: 0.6947 +[2026-01-29T21:40:40.078357Z] Loop 744: Loss: 1.68e-02, Avg Return: 0.304, Regret: 0.4920, Entropy: 0.6947 +[2026-01-29T21:40:41.278925Z] Loop 745: Loss: 1.70e-02, Avg Return: 0.308, Regret: 0.4920, Entropy: 0.6947 +[2026-01-29T21:40:42.440055Z] Loop 746: Loss: 1.51e-02, Avg Return: 0.308, Regret: 0.4920, Entropy: 0.6946 +[2026-01-29T21:40:43.599832Z] Loop 747: Loss: 1.66e-02, Avg Return: 0.312, Regret: 0.4920, Entropy: 0.6944 +[2026-01-29T21:40:44.760695Z] Loop 748: Loss: 1.61e-02, Avg Return: 0.318, Regret: 0.4920, Entropy: 0.6943 +[2026-01-29T21:40:45.919886Z] Loop 749: Loss: 1.68e-02, Avg Return: 0.311, Regret: 0.4920, Entropy: 0.6943 +[2026-01-29T21:40:47.123130Z] Loop 750: Loss: 1.68e-02, Avg Return: 0.313, Regret: 0.4920, Entropy: 0.6946 +[2026-01-29T21:40:48.285105Z] Loop 751: Loss: 1.55e-02, Avg Return: 0.308, Regret: 0.4920, Entropy: 0.6948 +[2026-01-29T21:40:49.446259Z] Loop 752: Loss: 1.64e-02, Avg Return: 0.314, Regret: 0.4920, Entropy: 0.6949 +[2026-01-29T21:40:50.607031Z] Loop 753: Loss: 1.58e-02, Avg Return: 0.313, Regret: 0.4920, Entropy: 0.6948 +[2026-01-29T21:40:51.767555Z] Loop 754: Loss: 1.60e-02, Avg Return: 0.307, Regret: 0.4920, Entropy: 0.6948 +[2026-01-29T21:40:52.971057Z] Loop 755: Loss: 1.58e-02, Avg Return: 0.313, Regret: 0.4919, Entropy: 0.6949 +[2026-01-29T21:40:54.131589Z] Loop 756: Loss: 1.68e-02, Avg Return: 0.315, Regret: 0.4919, Entropy: 0.6949 +[2026-01-29T21:40:55.290463Z] Loop 757: Loss: 1.83e-02, Avg Return: 0.313, Regret: 0.4919, Entropy: 0.6945 +[2026-01-29T21:40:56.450221Z] Loop 758: Loss: 1.72e-02, Avg Return: 0.313, Regret: 0.4919, Entropy: 0.6943 +[2026-01-29T21:40:57.608821Z] Loop 759: Loss: 1.57e-02, Avg Return: 0.312, Regret: 0.4919, Entropy: 0.6947 +[2026-01-29T21:40:58.809873Z] Loop 760: Loss: 1.62e-02, Avg Return: 0.310, Regret: 0.4919, Entropy: 0.6950 +[2026-01-29T21:40:59.969485Z] Loop 761: Loss: 1.56e-02, Avg Return: 0.305, Regret: 0.4919, Entropy: 0.6950 +[2026-01-29T21:41:01.128979Z] Loop 762: Loss: 1.70e-02, Avg Return: 0.316, Regret: 0.4919, Entropy: 0.6946 +[2026-01-29T21:41:02.288829Z] Loop 763: Loss: 1.69e-02, Avg Return: 0.311, Regret: 0.4919, Entropy: 0.6939 +[2026-01-29T21:41:03.448949Z] Loop 764: Loss: 1.67e-02, Avg Return: 0.306, Regret: 0.4919, Entropy: 0.6934 +[2026-01-29T21:41:04.650171Z] Loop 765: Loss: 1.65e-02, Avg Return: 0.310, Regret: 0.4922, Entropy: 0.6935 +[2026-01-29T21:41:05.810807Z] Loop 766: Loss: 1.60e-02, Avg Return: 0.311, Regret: 0.4922, Entropy: 0.6940 +[2026-01-29T21:41:06.970480Z] Loop 767: Loss: 1.63e-02, Avg Return: 0.309, Regret: 0.4922, Entropy: 0.6947 +[2026-01-29T21:41:08.131196Z] Loop 768: Loss: 1.66e-02, Avg Return: 0.311, Regret: 0.4922, Entropy: 0.6949 +[2026-01-29T21:41:09.291234Z] Loop 769: Loss: 1.66e-02, Avg Return: 0.310, Regret: 0.4922, Entropy: 0.6947 +[2026-01-29T21:41:10.492971Z] Loop 770: Loss: 1.81e-02, Avg Return: 0.318, Regret: 0.4920, Entropy: 0.6944 +[2026-01-29T21:41:11.656702Z] Loop 771: Loss: 1.63e-02, Avg Return: 0.312, Regret: 0.4920, Entropy: 0.6940 +[2026-01-29T21:41:12.816678Z] Loop 772: Loss: 1.84e-02, Avg Return: 0.317, Regret: 0.4920, Entropy: 0.6936 +[2026-01-29T21:41:13.976803Z] Loop 773: Loss: 1.55e-02, Avg Return: 0.313, Regret: 0.4920, Entropy: 0.6937 +[2026-01-29T21:41:15.138767Z] Loop 774: Loss: 1.79e-02, Avg Return: 0.316, Regret: 0.4920, Entropy: 0.6943 +[2026-01-29T21:41:16.353736Z] Loop 775: Loss: 1.57e-02, Avg Return: 0.317, Regret: 0.4918, Entropy: 0.6947 +[2026-01-29T21:41:17.516041Z] Loop 776: Loss: 1.76e-02, Avg Return: 0.315, Regret: 0.4918, Entropy: 0.6947 +[2026-01-29T21:41:18.683574Z] Loop 777: Loss: 1.60e-02, Avg Return: 0.314, Regret: 0.4918, Entropy: 0.6944 +[2026-01-29T21:41:19.846997Z] Loop 778: Loss: 1.69e-02, Avg Return: 0.315, Regret: 0.4918, Entropy: 0.6942 +[2026-01-29T21:41:21.008039Z] Loop 779: Loss: 1.77e-02, Avg Return: 0.308, Regret: 0.4918, Entropy: 0.6942 +[2026-01-29T21:41:22.214313Z] Loop 780: Loss: 1.64e-02, Avg Return: 0.308, Regret: 0.4919, Entropy: 0.6938 +[2026-01-29T21:41:23.379880Z] Loop 781: Loss: 1.67e-02, Avg Return: 0.313, Regret: 0.4919, Entropy: 0.6933 +[2026-01-29T21:41:24.541876Z] Loop 782: Loss: 1.67e-02, Avg Return: 0.312, Regret: 0.4919, Entropy: 0.6934 +[2026-01-29T21:41:25.701824Z] Loop 783: Loss: 1.70e-02, Avg Return: 0.315, Regret: 0.4919, Entropy: 0.6939 +[2026-01-29T21:41:26.863916Z] Loop 784: Loss: 1.77e-02, Avg Return: 0.317, Regret: 0.4919, Entropy: 0.6944 +[2026-01-29T21:41:28.069424Z] Loop 785: Loss: 1.66e-02, Avg Return: 0.316, Regret: 0.4917, Entropy: 0.6945 +[2026-01-29T21:41:29.234436Z] Loop 786: Loss: 1.68e-02, Avg Return: 0.310, Regret: 0.4917, Entropy: 0.6945 +[2026-01-29T21:41:30.393385Z] Loop 787: Loss: 1.58e-02, Avg Return: 0.310, Regret: 0.4917, Entropy: 0.6946 +[2026-01-29T21:41:31.553856Z] Loop 788: Loss: 1.86e-02, Avg Return: 0.316, Regret: 0.4917, Entropy: 0.6946 +[2026-01-29T21:41:32.712962Z] Loop 789: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4917, Entropy: 0.6946 +[2026-01-29T21:41:33.924266Z] Loop 790: Loss: 1.64e-02, Avg Return: 0.305, Regret: 0.4916, Entropy: 0.6946 +[2026-01-29T21:41:35.086523Z] Loop 791: Loss: 1.58e-02, Avg Return: 0.309, Regret: 0.4916, Entropy: 0.6946 +[2026-01-29T21:41:36.248205Z] Loop 792: Loss: 1.59e-02, Avg Return: 0.310, Regret: 0.4916, Entropy: 0.6946 +[2026-01-29T21:41:37.409514Z] Loop 793: Loss: 1.68e-02, Avg Return: 0.312, Regret: 0.4916, Entropy: 0.6947 +[2026-01-29T21:41:38.570800Z] Loop 794: Loss: 1.61e-02, Avg Return: 0.312, Regret: 0.4916, Entropy: 0.6947 +[2026-01-29T21:41:39.776470Z] Loop 795: Loss: 1.62e-02, Avg Return: 0.313, Regret: 0.4916, Entropy: 0.6947 +[2026-01-29T21:41:40.936964Z] Loop 796: Loss: 1.61e-02, Avg Return: 0.313, Regret: 0.4916, Entropy: 0.6946 +[2026-01-29T21:41:42.096057Z] Loop 797: Loss: 1.67e-02, Avg Return: 0.312, Regret: 0.4916, Entropy: 0.6947 +[2026-01-29T21:41:43.255840Z] Loop 798: Loss: 1.67e-02, Avg Return: 0.318, Regret: 0.4916, Entropy: 0.6948 +[2026-01-29T21:41:44.415473Z] Loop 799: Loss: 1.64e-02, Avg Return: 0.306, Regret: 0.4916, Entropy: 0.6947 +[2026-01-29T21:41:45.618365Z] Loop 800: Loss: 1.63e-02, Avg Return: 0.309, Regret: 0.4916, Entropy: 0.6946 +[2026-01-29T21:41:46.778848Z] Loop 801: Loss: 1.69e-02, Avg Return: 0.309, Regret: 0.4916, Entropy: 0.6946 +[2026-01-29T21:41:47.939388Z] Loop 802: Loss: 1.59e-02, Avg Return: 0.315, Regret: 0.4916, Entropy: 0.6947 +[2026-01-29T21:41:49.097816Z] Loop 803: Loss: 1.58e-02, Avg Return: 0.312, Regret: 0.4916, Entropy: 0.6948 +[2026-01-29T21:41:50.257805Z] Loop 804: Loss: 1.59e-02, Avg Return: 0.314, Regret: 0.4916, Entropy: 0.6948 +[2026-01-29T21:41:51.458663Z] Loop 805: Loss: 1.64e-02, Avg Return: 0.313, Regret: 0.4914, Entropy: 0.6947 +[2026-01-29T21:41:52.619278Z] Loop 806: Loss: 1.60e-02, Avg Return: 0.304, Regret: 0.4914, Entropy: 0.6947 +[2026-01-29T21:41:53.781581Z] Loop 807: Loss: 1.62e-02, Avg Return: 0.313, Regret: 0.4914, Entropy: 0.6946 +[2026-01-29T21:41:54.940873Z] Loop 808: Loss: 1.67e-02, Avg Return: 0.309, Regret: 0.4914, Entropy: 0.6945 +[2026-01-29T21:41:56.102898Z] Loop 809: Loss: 1.58e-02, Avg Return: 0.310, Regret: 0.4914, Entropy: 0.6944 +[2026-01-29T21:41:57.307462Z] Loop 810: Loss: 1.65e-02, Avg Return: 0.314, Regret: 0.4915, Entropy: 0.6943 +[2026-01-29T21:41:58.466679Z] Loop 811: Loss: 1.60e-02, Avg Return: 0.313, Regret: 0.4915, Entropy: 0.6941 +[2026-01-29T21:41:59.627690Z] Loop 812: Loss: 1.74e-02, Avg Return: 0.319, Regret: 0.4915, Entropy: 0.6943 +[2026-01-29T21:42:00.787292Z] Loop 813: Loss: 1.75e-02, Avg Return: 0.312, Regret: 0.4915, Entropy: 0.6944 +[2026-01-29T21:42:01.946656Z] Loop 814: Loss: 1.71e-02, Avg Return: 0.310, Regret: 0.4915, Entropy: 0.6945 +[2026-01-29T21:42:03.152503Z] Loop 815: Loss: 1.56e-02, Avg Return: 0.312, Regret: 0.4914, Entropy: 0.6939 +[2026-01-29T21:42:04.313861Z] Loop 816: Loss: 1.63e-02, Avg Return: 0.313, Regret: 0.4914, Entropy: 0.6925 +[2026-01-29T21:42:05.473403Z] Loop 817: Loss: 1.62e-02, Avg Return: 0.311, Regret: 0.4914, Entropy: 0.6912 +[2026-01-29T21:42:06.634534Z] Loop 818: Loss: 1.66e-02, Avg Return: 0.316, Regret: 0.4914, Entropy: 0.6904 +[2026-01-29T21:42:07.793988Z] Loop 819: Loss: 1.63e-02, Avg Return: 0.309, Regret: 0.4914, Entropy: 0.6895 +[2026-01-29T21:42:08.996823Z] Loop 820: Loss: 1.51e-02, Avg Return: 0.310, Regret: 0.4923, Entropy: 0.6906 +[2026-01-29T21:42:10.157503Z] Loop 821: Loss: 1.60e-02, Avg Return: 0.317, Regret: 0.4923, Entropy: 0.6915 +[2026-01-29T21:42:11.318111Z] Loop 822: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4923, Entropy: 0.6922 +[2026-01-29T21:42:12.480683Z] Loop 823: Loss: 1.72e-02, Avg Return: 0.314, Regret: 0.4923, Entropy: 0.6929 +[2026-01-29T21:42:13.639874Z] Loop 824: Loss: 1.60e-02, Avg Return: 0.311, Regret: 0.4923, Entropy: 0.6932 +[2026-01-29T21:42:14.841754Z] Loop 825: Loss: 1.50e-02, Avg Return: 0.312, Regret: 0.4914, Entropy: 0.6933 +[2026-01-29T21:42:16.002407Z] Loop 826: Loss: 1.62e-02, Avg Return: 0.311, Regret: 0.4914, Entropy: 0.6938 +[2026-01-29T21:42:17.165512Z] Loop 827: Loss: 1.72e-02, Avg Return: 0.314, Regret: 0.4914, Entropy: 0.6944 +[2026-01-29T21:42:18.325728Z] Loop 828: Loss: 1.73e-02, Avg Return: 0.314, Regret: 0.4914, Entropy: 0.6940 +[2026-01-29T21:42:19.484743Z] Loop 829: Loss: 1.69e-02, Avg Return: 0.305, Regret: 0.4914, Entropy: 0.6924 +[2026-01-29T21:42:20.688041Z] Loop 830: Loss: 1.62e-02, Avg Return: 0.314, Regret: 0.4924, Entropy: 0.6905 +[2026-01-29T21:42:21.850598Z] Loop 831: Loss: 1.64e-02, Avg Return: 0.310, Regret: 0.4924, Entropy: 0.6895 +[2026-01-29T21:42:23.016911Z] Loop 832: Loss: 1.58e-02, Avg Return: 0.310, Regret: 0.4924, Entropy: 0.6913 +[2026-01-29T21:42:24.177476Z] Loop 833: Loss: 1.73e-02, Avg Return: 0.315, Regret: 0.4924, Entropy: 0.6928 +[2026-01-29T21:42:25.336972Z] Loop 834: Loss: 1.59e-02, Avg Return: 0.309, Regret: 0.4924, Entropy: 0.6940 +[2026-01-29T21:42:26.544589Z] Loop 835: Loss: 1.61e-02, Avg Return: 0.316, Regret: 0.4909, Entropy: 0.6943 +[2026-01-29T21:42:27.705182Z] Loop 836: Loss: 1.78e-02, Avg Return: 0.317, Regret: 0.4909, Entropy: 0.6937 +[2026-01-29T21:42:28.866257Z] Loop 837: Loss: 1.54e-02, Avg Return: 0.308, Regret: 0.4909, Entropy: 0.6922 +[2026-01-29T21:42:30.025886Z] Loop 838: Loss: 1.52e-02, Avg Return: 0.310, Regret: 0.4909, Entropy: 0.6913 +[2026-01-29T21:42:31.185825Z] Loop 839: Loss: 1.61e-02, Avg Return: 0.308, Regret: 0.4909, Entropy: 0.6911 +[2026-01-29T21:42:32.386675Z] Loop 840: Loss: 1.73e-02, Avg Return: 0.313, Regret: 0.4915, Entropy: 0.6916 +[2026-01-29T21:42:33.547267Z] Loop 841: Loss: 1.64e-02, Avg Return: 0.313, Regret: 0.4915, Entropy: 0.6924 +[2026-01-29T21:42:34.706188Z] Loop 842: Loss: 1.62e-02, Avg Return: 0.315, Regret: 0.4915, Entropy: 0.6936 +[2026-01-29T21:42:35.867329Z] Loop 843: Loss: 1.52e-02, Avg Return: 0.309, Regret: 0.4915, Entropy: 0.6942 +[2026-01-29T21:42:37.027551Z] Loop 844: Loss: 1.63e-02, Avg Return: 0.307, Regret: 0.4915, Entropy: 0.6941 +[2026-01-29T21:42:38.231544Z] Loop 845: Loss: 1.68e-02, Avg Return: 0.315, Regret: 0.4908, Entropy: 0.6939 +[2026-01-29T21:42:39.392922Z] Loop 846: Loss: 1.63e-02, Avg Return: 0.318, Regret: 0.4908, Entropy: 0.6935 +[2026-01-29T21:42:40.554515Z] Loop 847: Loss: 1.67e-02, Avg Return: 0.316, Regret: 0.4908, Entropy: 0.6921 +[2026-01-29T21:42:41.714449Z] Loop 848: Loss: 1.60e-02, Avg Return: 0.306, Regret: 0.4908, Entropy: 0.6911 +[2026-01-29T21:42:42.874540Z] Loop 849: Loss: 1.63e-02, Avg Return: 0.310, Regret: 0.4908, Entropy: 0.6897 +[2026-01-29T21:42:44.075067Z] Loop 850: Loss: 1.57e-02, Avg Return: 0.313, Regret: 0.4918, Entropy: 0.6903 +[2026-01-29T21:42:45.236540Z] Loop 851: Loss: 1.60e-02, Avg Return: 0.315, Regret: 0.4918, Entropy: 0.6921 +[2026-01-29T21:42:46.395951Z] Loop 852: Loss: 1.73e-02, Avg Return: 0.315, Regret: 0.4918, Entropy: 0.6937 +[2026-01-29T21:42:47.556081Z] Loop 853: Loss: 1.52e-02, Avg Return: 0.315, Regret: 0.4918, Entropy: 0.6938 +[2026-01-29T21:42:48.715261Z] Loop 854: Loss: 1.62e-02, Avg Return: 0.316, Regret: 0.4918, Entropy: 0.6912 +[2026-01-29T21:42:49.916291Z] Loop 855: Loss: 1.64e-02, Avg Return: 0.313, Regret: 0.4916, Entropy: 0.6896 +[2026-01-29T21:42:51.077002Z] Loop 856: Loss: 1.58e-02, Avg Return: 0.312, Regret: 0.4916, Entropy: 0.6888 +[2026-01-29T21:42:52.238522Z] Loop 857: Loss: 1.58e-02, Avg Return: 0.311, Regret: 0.4916, Entropy: 0.6901 +[2026-01-29T21:42:53.398369Z] Loop 858: Loss: 1.58e-02, Avg Return: 0.315, Regret: 0.4916, Entropy: 0.6928 +[2026-01-29T21:42:54.558544Z] Loop 859: Loss: 1.60e-02, Avg Return: 0.313, Regret: 0.4916, Entropy: 0.6942 +[2026-01-29T21:42:55.761255Z] Loop 860: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4904, Entropy: 0.6940 +[2026-01-29T21:42:56.923230Z] Loop 861: Loss: 1.69e-02, Avg Return: 0.317, Regret: 0.4904, Entropy: 0.6933 +[2026-01-29T21:42:58.083268Z] Loop 862: Loss: 1.70e-02, Avg Return: 0.314, Regret: 0.4904, Entropy: 0.6927 +[2026-01-29T21:42:59.246498Z] Loop 863: Loss: 1.49e-02, Avg Return: 0.311, Regret: 0.4904, Entropy: 0.6919 +[2026-01-29T21:43:00.407830Z] Loop 864: Loss: 1.51e-02, Avg Return: 0.313, Regret: 0.4904, Entropy: 0.6920 +[2026-01-29T21:43:01.609884Z] Loop 865: Loss: 1.63e-02, Avg Return: 0.309, Regret: 0.4907, Entropy: 0.6927 +[2026-01-29T21:43:02.773709Z] Loop 866: Loss: 1.51e-02, Avg Return: 0.310, Regret: 0.4907, Entropy: 0.6937 +[2026-01-29T21:43:03.936166Z] Loop 867: Loss: 1.69e-02, Avg Return: 0.315, Regret: 0.4907, Entropy: 0.6942 +[2026-01-29T21:43:05.097152Z] Loop 868: Loss: 1.59e-02, Avg Return: 0.311, Regret: 0.4907, Entropy: 0.6942 +[2026-01-29T21:43:06.257536Z] Loop 869: Loss: 1.59e-02, Avg Return: 0.314, Regret: 0.4907, Entropy: 0.6941 +[2026-01-29T21:43:07.463897Z] Loop 870: Loss: 1.62e-02, Avg Return: 0.309, Regret: 0.4900, Entropy: 0.6940 +[2026-01-29T21:43:08.626626Z] Loop 871: Loss: 1.63e-02, Avg Return: 0.315, Regret: 0.4900, Entropy: 0.6940 +[2026-01-29T21:43:09.787493Z] Loop 872: Loss: 1.50e-02, Avg Return: 0.309, Regret: 0.4900, Entropy: 0.6940 +[2026-01-29T21:43:10.948617Z] Loop 873: Loss: 1.71e-02, Avg Return: 0.318, Regret: 0.4900, Entropy: 0.6941 +[2026-01-29T21:43:12.110797Z] Loop 874: Loss: 1.59e-02, Avg Return: 0.319, Regret: 0.4900, Entropy: 0.6941 +[2026-01-29T21:43:13.315974Z] Loop 875: Loss: 1.67e-02, Avg Return: 0.312, Regret: 0.4897, Entropy: 0.6941 +[2026-01-29T21:43:14.477153Z] Loop 876: Loss: 1.70e-02, Avg Return: 0.317, Regret: 0.4897, Entropy: 0.6940 +[2026-01-29T21:43:15.638554Z] Loop 877: Loss: 1.61e-02, Avg Return: 0.313, Regret: 0.4897, Entropy: 0.6939 +[2026-01-29T21:43:16.800297Z] Loop 878: Loss: 1.58e-02, Avg Return: 0.314, Regret: 0.4897, Entropy: 0.6939 +[2026-01-29T21:43:17.961422Z] Loop 879: Loss: 1.56e-02, Avg Return: 0.314, Regret: 0.4897, Entropy: 0.6939 +[2026-01-29T21:43:19.174011Z] Loop 880: Loss: 1.64e-02, Avg Return: 0.320, Regret: 0.4895, Entropy: 0.6938 +[2026-01-29T21:43:20.332565Z] Loop 881: Loss: 1.65e-02, Avg Return: 0.319, Regret: 0.4895, Entropy: 0.6936 +[2026-01-29T21:43:21.492953Z] Loop 882: Loss: 1.61e-02, Avg Return: 0.313, Regret: 0.4895, Entropy: 0.6933 +[2026-01-29T21:43:22.651731Z] Loop 883: Loss: 1.63e-02, Avg Return: 0.314, Regret: 0.4895, Entropy: 0.6929 +[2026-01-29T21:43:23.810993Z] Loop 884: Loss: 1.60e-02, Avg Return: 0.311, Regret: 0.4895, Entropy: 0.6930 +[2026-01-29T21:43:25.011598Z] Loop 885: Loss: 1.59e-02, Avg Return: 0.318, Regret: 0.4893, Entropy: 0.6930 +[2026-01-29T21:43:26.173306Z] Loop 886: Loss: 1.60e-02, Avg Return: 0.310, Regret: 0.4893, Entropy: 0.6930 +[2026-01-29T21:43:27.333299Z] Loop 887: Loss: 1.59e-02, Avg Return: 0.311, Regret: 0.4893, Entropy: 0.6935 +[2026-01-29T21:43:28.494393Z] Loop 888: Loss: 1.50e-02, Avg Return: 0.308, Regret: 0.4893, Entropy: 0.6935 +[2026-01-29T21:43:29.654714Z] Loop 889: Loss: 1.57e-02, Avg Return: 0.305, Regret: 0.4893, Entropy: 0.6927 +[2026-01-29T21:43:30.858414Z] Loop 890: Loss: 1.72e-02, Avg Return: 0.323, Regret: 0.4895, Entropy: 0.6915 +[2026-01-29T21:43:32.021156Z] Loop 891: Loss: 1.51e-02, Avg Return: 0.314, Regret: 0.4895, Entropy: 0.6903 +[2026-01-29T21:43:33.180790Z] Loop 892: Loss: 1.73e-02, Avg Return: 0.310, Regret: 0.4895, Entropy: 0.6904 +[2026-01-29T21:43:34.339839Z] Loop 893: Loss: 1.56e-02, Avg Return: 0.310, Regret: 0.4895, Entropy: 0.6920 +[2026-01-29T21:43:35.501726Z] Loop 894: Loss: 1.61e-02, Avg Return: 0.317, Regret: 0.4895, Entropy: 0.6929 +[2026-01-29T21:43:36.707521Z] Loop 895: Loss: 1.64e-02, Avg Return: 0.312, Regret: 0.4884, Entropy: 0.6929 +[2026-01-29T21:43:37.867625Z] Loop 896: Loss: 1.57e-02, Avg Return: 0.314, Regret: 0.4884, Entropy: 0.6919 +[2026-01-29T21:43:39.027025Z] Loop 897: Loss: 1.63e-02, Avg Return: 0.318, Regret: 0.4884, Entropy: 0.6906 +[2026-01-29T21:43:40.186696Z] Loop 898: Loss: 1.63e-02, Avg Return: 0.319, Regret: 0.4884, Entropy: 0.6896 +[2026-01-29T21:43:41.346351Z] Loop 899: Loss: 1.52e-02, Avg Return: 0.316, Regret: 0.4884, Entropy: 0.6914 +[2026-01-29T21:43:42.549145Z] Loop 900: Loss: 1.58e-02, Avg Return: 0.323, Regret: 0.4881, Entropy: 0.6924 +[2026-01-29T21:43:43.709922Z] Loop 901: Loss: 1.67e-02, Avg Return: 0.316, Regret: 0.4881, Entropy: 0.6925 +[2026-01-29T21:43:44.869863Z] Loop 902: Loss: 1.74e-02, Avg Return: 0.323, Regret: 0.4881, Entropy: 0.6905 +[2026-01-29T21:43:46.029382Z] Loop 903: Loss: 1.64e-02, Avg Return: 0.315, Regret: 0.4881, Entropy: 0.6879 +[2026-01-29T21:43:47.188836Z] Loop 904: Loss: 1.64e-02, Avg Return: 0.311, Regret: 0.4881, Entropy: 0.6872 +[2026-01-29T21:43:48.388044Z] Loop 905: Loss: 1.62e-02, Avg Return: 0.323, Regret: 0.4886, Entropy: 0.6896 +[2026-01-29T21:43:49.548738Z] Loop 906: Loss: 1.54e-02, Avg Return: 0.317, Regret: 0.4886, Entropy: 0.6915 +[2026-01-29T21:43:50.708269Z] Loop 907: Loss: 1.66e-02, Avg Return: 0.321, Regret: 0.4886, Entropy: 0.6921 +[2026-01-29T21:43:51.875787Z] Loop 908: Loss: 1.58e-02, Avg Return: 0.317, Regret: 0.4886, Entropy: 0.6922 +[2026-01-29T21:43:53.034034Z] Loop 909: Loss: 1.65e-02, Avg Return: 0.323, Regret: 0.4886, Entropy: 0.6920 +[2026-01-29T21:43:54.236524Z] Loop 910: Loss: 1.59e-02, Avg Return: 0.320, Regret: 0.4871, Entropy: 0.6918 +[2026-01-29T21:43:55.397617Z] Loop 911: Loss: 1.64e-02, Avg Return: 0.319, Regret: 0.4871, Entropy: 0.6917 +[2026-01-29T21:43:56.556657Z] Loop 912: Loss: 1.56e-02, Avg Return: 0.324, Regret: 0.4871, Entropy: 0.6919 +[2026-01-29T21:43:57.715033Z] Loop 913: Loss: 1.64e-02, Avg Return: 0.323, Regret: 0.4871, Entropy: 0.6919 +[2026-01-29T21:43:58.875848Z] Loop 914: Loss: 1.69e-02, Avg Return: 0.313, Regret: 0.4871, Entropy: 0.6917 +[2026-01-29T21:44:00.079029Z] Loop 915: Loss: 1.64e-02, Avg Return: 0.313, Regret: 0.4864, Entropy: 0.6916 +[2026-01-29T21:44:01.239769Z] Loop 916: Loss: 1.54e-02, Avg Return: 0.319, Regret: 0.4864, Entropy: 0.6915 +[2026-01-29T21:44:02.399377Z] Loop 917: Loss: 1.59e-02, Avg Return: 0.318, Regret: 0.4864, Entropy: 0.6915 +[2026-01-29T21:44:03.558864Z] Loop 918: Loss: 1.45e-02, Avg Return: 0.314, Regret: 0.4864, Entropy: 0.6913 +[2026-01-29T21:44:04.718207Z] Loop 919: Loss: 1.65e-02, Avg Return: 0.319, Regret: 0.4864, Entropy: 0.6906 +[2026-01-29T21:44:05.920771Z] Loop 920: Loss: 1.56e-02, Avg Return: 0.320, Regret: 0.4856, Entropy: 0.6906 +[2026-01-29T21:44:07.081945Z] Loop 921: Loss: 1.56e-02, Avg Return: 0.322, Regret: 0.4856, Entropy: 0.6904 +[2026-01-29T21:44:08.243214Z] Loop 922: Loss: 1.66e-02, Avg Return: 0.319, Regret: 0.4856, Entropy: 0.6902 +[2026-01-29T21:44:09.403053Z] Loop 923: Loss: 1.58e-02, Avg Return: 0.318, Regret: 0.4856, Entropy: 0.6906 +[2026-01-29T21:44:10.563569Z] Loop 924: Loss: 1.66e-02, Avg Return: 0.316, Regret: 0.4856, Entropy: 0.6902 +[2026-01-29T21:44:11.765534Z] Loop 925: Loss: 1.56e-02, Avg Return: 0.314, Regret: 0.4847, Entropy: 0.6897 +[2026-01-29T21:44:12.927901Z] Loop 926: Loss: 1.58e-02, Avg Return: 0.320, Regret: 0.4847, Entropy: 0.6899 +[2026-01-29T21:44:14.087582Z] Loop 927: Loss: 1.58e-02, Avg Return: 0.328, Regret: 0.4847, Entropy: 0.6888 +[2026-01-29T21:44:15.249553Z] Loop 928: Loss: 1.59e-02, Avg Return: 0.322, Regret: 0.4847, Entropy: 0.6864 +[2026-01-29T21:44:16.409007Z] Loop 929: Loss: 1.68e-02, Avg Return: 0.322, Regret: 0.4847, Entropy: 0.6847 +[2026-01-29T21:44:17.621490Z] Loop 930: Loss: 1.53e-02, Avg Return: 0.321, Regret: 0.4843, Entropy: 0.6838 +[2026-01-29T21:44:18.782918Z] Loop 931: Loss: 1.57e-02, Avg Return: 0.322, Regret: 0.4843, Entropy: 0.6857 +[2026-01-29T21:44:19.943687Z] Loop 932: Loss: 1.49e-02, Avg Return: 0.316, Regret: 0.4843, Entropy: 0.6869 +[2026-01-29T21:44:21.103027Z] Loop 933: Loss: 1.56e-02, Avg Return: 0.317, Regret: 0.4843, Entropy: 0.6878 +[2026-01-29T21:44:22.262445Z] Loop 934: Loss: 1.43e-02, Avg Return: 0.319, Regret: 0.4843, Entropy: 0.6864 +[2026-01-29T21:44:23.468973Z] Loop 935: Loss: 1.49e-02, Avg Return: 0.325, Regret: 0.4826, Entropy: 0.6850 +[2026-01-29T21:44:24.629943Z] Loop 936: Loss: 1.58e-02, Avg Return: 0.327, Regret: 0.4826, Entropy: 0.6845 +[2026-01-29T21:44:25.789336Z] Loop 937: Loss: 1.54e-02, Avg Return: 0.326, Regret: 0.4826, Entropy: 0.6845 +[2026-01-29T21:44:26.948189Z] Loop 938: Loss: 1.54e-02, Avg Return: 0.322, Regret: 0.4826, Entropy: 0.6847 +[2026-01-29T21:44:28.109240Z] Loop 939: Loss: 1.43e-02, Avg Return: 0.317, Regret: 0.4826, Entropy: 0.6851 +[2026-01-29T21:44:29.312743Z] Loop 940: Loss: 1.52e-02, Avg Return: 0.321, Regret: 0.4809, Entropy: 0.6813 +[2026-01-29T21:44:30.472305Z] Loop 941: Loss: 1.46e-02, Avg Return: 0.321, Regret: 0.4809, Entropy: 0.6798 +[2026-01-29T21:44:31.632628Z] Loop 942: Loss: 1.47e-02, Avg Return: 0.329, Regret: 0.4809, Entropy: 0.6822 +[2026-01-29T21:44:32.791872Z] Loop 943: Loss: 1.43e-02, Avg Return: 0.325, Regret: 0.4809, Entropy: 0.6834 +[2026-01-29T21:44:33.951984Z] Loop 944: Loss: 1.40e-02, Avg Return: 0.327, Regret: 0.4809, Entropy: 0.6818 +[2026-01-29T21:44:35.155352Z] Loop 945: Loss: 1.60e-02, Avg Return: 0.330, Regret: 0.4785, Entropy: 0.6803 +[2026-01-29T21:44:36.315278Z] Loop 946: Loss: 1.60e-02, Avg Return: 0.328, Regret: 0.4785, Entropy: 0.6801 +[2026-01-29T21:44:37.474013Z] Loop 947: Loss: 1.42e-02, Avg Return: 0.324, Regret: 0.4785, Entropy: 0.6767 +[2026-01-29T21:44:38.633882Z] Loop 948: Loss: 1.49e-02, Avg Return: 0.327, Regret: 0.4785, Entropy: 0.6754 +[2026-01-29T21:44:39.795158Z] Loop 949: Loss: 1.34e-02, Avg Return: 0.317, Regret: 0.4785, Entropy: 0.6761 +[2026-01-29T21:44:40.998731Z] Loop 950: Loss: 1.44e-02, Avg Return: 0.327, Regret: 0.4762, Entropy: 0.6774 +[2026-01-29T21:44:42.157062Z] Loop 951: Loss: 1.42e-02, Avg Return: 0.320, Regret: 0.4762, Entropy: 0.6741 +[2026-01-29T21:44:43.315993Z] Loop 952: Loss: 1.44e-02, Avg Return: 0.330, Regret: 0.4762, Entropy: 0.6709 +[2026-01-29T21:44:44.474284Z] Loop 953: Loss: 1.42e-02, Avg Return: 0.330, Regret: 0.4762, Entropy: 0.6724 +[2026-01-29T21:44:45.633047Z] Loop 954: Loss: 1.47e-02, Avg Return: 0.330, Regret: 0.4762, Entropy: 0.6720 +[2026-01-29T21:44:46.838078Z] Loop 955: Loss: 1.45e-02, Avg Return: 0.329, Regret: 0.4742, Entropy: 0.6702 +[2026-01-29T21:44:48.003001Z] Loop 956: Loss: 1.40e-02, Avg Return: 0.331, Regret: 0.4742, Entropy: 0.6681 +[2026-01-29T21:44:49.164786Z] Loop 957: Loss: 1.38e-02, Avg Return: 0.328, Regret: 0.4742, Entropy: 0.6645 +[2026-01-29T21:44:50.325206Z] Loop 958: Loss: 1.26e-02, Avg Return: 0.333, Regret: 0.4742, Entropy: 0.6647 +[2026-01-29T21:44:51.485647Z] Loop 959: Loss: 1.38e-02, Avg Return: 0.329, Regret: 0.4742, Entropy: 0.6642 +[2026-01-29T21:44:52.691362Z] Loop 960: Loss: 1.50e-02, Avg Return: 0.336, Regret: 0.4721, Entropy: 0.6627 +[2026-01-29T21:44:53.850905Z] Loop 961: Loss: 1.41e-02, Avg Return: 0.325, Regret: 0.4721, Entropy: 0.6465 +[2026-01-29T21:44:55.010468Z] Loop 962: Loss: 1.37e-02, Avg Return: 0.324, Regret: 0.4721, Entropy: 0.6455 +[2026-01-29T21:44:56.171870Z] Loop 963: Loss: 1.36e-02, Avg Return: 0.336, Regret: 0.4721, Entropy: 0.6540 +[2026-01-29T21:44:57.330441Z] Loop 964: Loss: 1.38e-02, Avg Return: 0.333, Regret: 0.4721, Entropy: 0.6533 +[2026-01-29T21:44:58.534560Z] Loop 965: Loss: 1.46e-02, Avg Return: 0.334, Regret: 0.4740, Entropy: 0.6396 +[2026-01-29T21:44:59.695551Z] Loop 966: Loss: 1.38e-02, Avg Return: 0.335, Regret: 0.4740, Entropy: 0.6406 +[2026-01-29T21:45:00.856120Z] Loop 967: Loss: 1.38e-02, Avg Return: 0.340, Regret: 0.4740, Entropy: 0.6486 +[2026-01-29T21:45:02.015537Z] Loop 968: Loss: 1.21e-02, Avg Return: 0.329, Regret: 0.4740, Entropy: 0.6438 +[2026-01-29T21:45:03.174901Z] Loop 969: Loss: 1.30e-02, Avg Return: 0.326, Regret: 0.4740, Entropy: 0.6210 +[2026-01-29T21:45:04.376193Z] Loop 970: Loss: 1.35e-02, Avg Return: 0.333, Regret: 0.4749, Entropy: 0.6102 +[2026-01-29T21:45:05.536190Z] Loop 971: Loss: 1.26e-02, Avg Return: 0.330, Regret: 0.4749, Entropy: 0.6359 +[2026-01-29T21:45:06.696215Z] Loop 972: Loss: 1.28e-02, Avg Return: 0.339, Regret: 0.4749, Entropy: 0.6359 +[2026-01-29T21:45:07.857496Z] Loop 973: Loss: 1.27e-02, Avg Return: 0.334, Regret: 0.4749, Entropy: 0.6159 +[2026-01-29T21:45:09.016614Z] Loop 974: Loss: 1.23e-02, Avg Return: 0.334, Regret: 0.4749, Entropy: 0.6115 +[2026-01-29T21:45:10.223215Z] Loop 975: Loss: 1.24e-02, Avg Return: 0.341, Regret: 0.4676, Entropy: 0.6251 +[2026-01-29T21:45:11.382902Z] Loop 976: Loss: 1.18e-02, Avg Return: 0.341, Regret: 0.4676, Entropy: 0.6292 +[2026-01-29T21:45:12.543968Z] Loop 977: Loss: 1.26e-02, Avg Return: 0.338, Regret: 0.4676, Entropy: 0.6068 +[2026-01-29T21:45:13.702989Z] Loop 978: Loss: 1.19e-02, Avg Return: 0.325, Regret: 0.4676, Entropy: 0.5923 +[2026-01-29T21:45:14.862466Z] Loop 979: Loss: 1.32e-02, Avg Return: 0.339, Regret: 0.4676, Entropy: 0.5872 +[2026-01-29T21:45:16.067275Z] Loop 980: Loss: 1.17e-02, Avg Return: 0.331, Regret: 0.4660, Entropy: 0.6033 +[2026-01-29T21:45:17.228070Z] Loop 981: Loss: 1.11e-02, Avg Return: 0.343, Regret: 0.4660, Entropy: 0.6201 +[2026-01-29T21:45:18.387915Z] Loop 982: Loss: 1.20e-02, Avg Return: 0.338, Regret: 0.4660, Entropy: 0.6167 +[2026-01-29T21:45:19.549286Z] Loop 983: Loss: 1.13e-02, Avg Return: 0.343, Regret: 0.4660, Entropy: 0.6109 +[2026-01-29T21:45:20.708646Z] Loop 984: Loss: 1.22e-02, Avg Return: 0.346, Regret: 0.4660, Entropy: 0.6098 +[2026-01-29T21:45:21.914204Z] Loop 985: Loss: 1.12e-02, Avg Return: 0.346, Regret: 0.4627, Entropy: 0.6092 +[2026-01-29T21:45:23.074947Z] Loop 986: Loss: 1.13e-02, Avg Return: 0.341, Regret: 0.4627, Entropy: 0.6089 +[2026-01-29T21:45:24.238408Z] Loop 987: Loss: 1.11e-02, Avg Return: 0.342, Regret: 0.4627, Entropy: 0.6043 +[2026-01-29T21:45:25.399271Z] Loop 988: Loss: 1.05e-02, Avg Return: 0.338, Regret: 0.4627, Entropy: 0.5987 +[2026-01-29T21:45:26.560731Z] Loop 989: Loss: 1.10e-02, Avg Return: 0.348, Regret: 0.4627, Entropy: 0.5978 +[2026-01-29T21:45:27.772390Z] Loop 990: Loss: 1.04e-02, Avg Return: 0.342, Regret: 0.4596, Entropy: 0.5971 +[2026-01-29T21:45:28.932410Z] Loop 991: Loss: 1.00e-02, Avg Return: 0.343, Regret: 0.4596, Entropy: 0.5927 +[2026-01-29T21:45:30.090650Z] Loop 992: Loss: 1.05e-02, Avg Return: 0.343, Regret: 0.4596, Entropy: 0.5854 +[2026-01-29T21:45:31.250821Z] Loop 993: Loss: 1.10e-02, Avg Return: 0.350, Regret: 0.4596, Entropy: 0.5729 +[2026-01-29T21:45:32.411168Z] Loop 994: Loss: 9.63e-03, Avg Return: 0.338, Regret: 0.4596, Entropy: 0.5666 +[2026-01-29T21:45:33.616251Z] Loop 995: Loss: 1.06e-02, Avg Return: 0.341, Regret: 0.4584, Entropy: 0.5659 +[2026-01-29T21:45:34.775386Z] Loop 996: Loss: 1.02e-02, Avg Return: 0.344, Regret: 0.4584, Entropy: 0.5780 +[2026-01-29T21:45:35.935123Z] Loop 997: Loss: 9.59e-03, Avg Return: 0.343, Regret: 0.4584, Entropy: 0.5822 +[2026-01-29T21:45:37.094835Z] Loop 998: Loss: 9.44e-03, Avg Return: 0.349, Regret: 0.4584, Entropy: 0.5771 +[2026-01-29T21:45:38.254177Z] Loop 999: Loss: 1.01e-02, Avg Return: 0.352, Regret: 0.4584, Entropy: 0.5737 +[2026-01-29T21:45:39.460174Z] Loop 1000: Loss: 9.94e-03, Avg Return: 0.351, Regret: 0.4565, Entropy: 0.5744 +[2026-01-29T21:45:40.621186Z] Loop 1001: Loss: 9.82e-03, Avg Return: 0.347, Regret: 0.4565, Entropy: 0.5738 +[2026-01-29T21:45:41.780895Z] Loop 1002: Loss: 1.01e-02, Avg Return: 0.346, Regret: 0.4565, Entropy: 0.5652 +[2026-01-29T21:45:42.941287Z] Loop 1003: Loss: 1.05e-02, Avg Return: 0.348, Regret: 0.4565, Entropy: 0.5623 +[2026-01-29T21:45:44.101661Z] Loop 1004: Loss: 1.03e-02, Avg Return: 0.349, Regret: 0.4565, Entropy: 0.5548 +[2026-01-29T21:45:45.308544Z] Loop 1005: Loss: 9.80e-03, Avg Return: 0.340, Regret: 0.4560, Entropy: 0.5591 +[2026-01-29T21:45:46.468156Z] Loop 1006: Loss: 9.38e-03, Avg Return: 0.356, Regret: 0.4560, Entropy: 0.5517 +[2026-01-29T21:45:47.629061Z] Loop 1007: Loss: 9.83e-03, Avg Return: 0.346, Regret: 0.4560, Entropy: 0.5214 +[2026-01-29T21:45:48.790104Z] Loop 1008: Loss: 9.89e-03, Avg Return: 0.333, Regret: 0.4560, Entropy: 0.4783 +[2026-01-29T21:45:49.949526Z] Loop 1009: Loss: 1.16e-02, Avg Return: 0.341, Regret: 0.4560, Entropy: 0.4541 +[2026-01-29T21:45:51.154864Z] Loop 1010: Loss: 1.04e-02, Avg Return: 0.341, Regret: 0.4583, Entropy: 0.4867 +[2026-01-29T21:45:52.316960Z] Loop 1011: Loss: 9.12e-03, Avg Return: 0.348, Regret: 0.4583, Entropy: 0.5211 +[2026-01-29T21:45:53.481388Z] Loop 1012: Loss: 9.23e-03, Avg Return: 0.353, Regret: 0.4583, Entropy: 0.5449 +[2026-01-29T21:45:54.640905Z] Loop 1013: Loss: 9.66e-03, Avg Return: 0.350, Regret: 0.4583, Entropy: 0.5370 +[2026-01-29T21:45:55.800436Z] Loop 1014: Loss: 1.00e-02, Avg Return: 0.347, Regret: 0.4583, Entropy: 0.5233 +[2026-01-29T21:45:57.005315Z] Loop 1015: Loss: 1.12e-02, Avg Return: 0.351, Regret: 0.4593, Entropy: 0.5130 +[2026-01-29T21:45:58.167589Z] Loop 1016: Loss: 8.77e-03, Avg Return: 0.349, Regret: 0.4593, Entropy: 0.5283 +[2026-01-29T21:45:59.326918Z] Loop 1017: Loss: 9.67e-03, Avg Return: 0.354, Regret: 0.4593, Entropy: 0.5329 +[2026-01-29T21:46:00.487409Z] Loop 1018: Loss: 9.15e-03, Avg Return: 0.356, Regret: 0.4593, Entropy: 0.5253 +[2026-01-29T21:46:01.646180Z] Loop 1019: Loss: 9.56e-03, Avg Return: 0.357, Regret: 0.4593, Entropy: 0.5002 +[2026-01-29T21:46:02.853536Z] Loop 1020: Loss: 8.74e-03, Avg Return: 0.356, Regret: 0.4508, Entropy: 0.4828 +[2026-01-29T21:46:04.014305Z] Loop 1021: Loss: 8.78e-03, Avg Return: 0.352, Regret: 0.4508, Entropy: 0.4605 +[2026-01-29T21:46:05.173762Z] Loop 1022: Loss: 8.78e-03, Avg Return: 0.367, Regret: 0.4508, Entropy: 0.4798 +[2026-01-29T21:46:06.332865Z] Loop 1023: Loss: 7.86e-03, Avg Return: 0.352, Regret: 0.4508, Entropy: 0.4952 +[2026-01-29T21:46:07.492420Z] Loop 1024: Loss: 9.14e-03, Avg Return: 0.362, Regret: 0.4508, Entropy: 0.5058 +[2026-01-29T21:46:08.702348Z] Loop 1025: Loss: 8.33e-03, Avg Return: 0.352, Regret: 0.4494, Entropy: 0.5066 +[2026-01-29T21:46:09.863403Z] Loop 1026: Loss: 8.87e-03, Avg Return: 0.352, Regret: 0.4494, Entropy: 0.4959 +[2026-01-29T21:46:11.029263Z] Loop 1027: Loss: 8.81e-03, Avg Return: 0.347, Regret: 0.4494, Entropy: 0.4802 +[2026-01-29T21:46:12.188931Z] Loop 1028: Loss: 8.68e-03, Avg Return: 0.359, Regret: 0.4494, Entropy: 0.4978 +[2026-01-29T21:46:13.353282Z] Loop 1029: Loss: 7.92e-03, Avg Return: 0.355, Regret: 0.4494, Entropy: 0.4889 +[2026-01-29T21:46:14.560420Z] Loop 1030: Loss: 8.11e-03, Avg Return: 0.361, Regret: 0.4461, Entropy: 0.4622 +[2026-01-29T21:46:15.720201Z] Loop 1031: Loss: 8.18e-03, Avg Return: 0.355, Regret: 0.4461, Entropy: 0.4194 +[2026-01-29T21:46:16.880270Z] Loop 1032: Loss: 8.81e-03, Avg Return: 0.349, Regret: 0.4461, Entropy: 0.3886 +[2026-01-29T21:46:18.040842Z] Loop 1033: Loss: 8.95e-03, Avg Return: 0.353, Regret: 0.4461, Entropy: 0.3859 +[2026-01-29T21:46:19.200476Z] Loop 1034: Loss: 8.18e-03, Avg Return: 0.357, Regret: 0.4461, Entropy: 0.4142 +[2026-01-29T21:46:20.407550Z] Loop 1035: Loss: 8.17e-03, Avg Return: 0.368, Regret: 0.4445, Entropy: 0.4471 +[2026-01-29T21:46:21.567649Z] Loop 1036: Loss: 7.40e-03, Avg Return: 0.360, Regret: 0.4445, Entropy: 0.4826 +[2026-01-29T21:46:22.727097Z] Loop 1037: Loss: 7.71e-03, Avg Return: 0.362, Regret: 0.4445, Entropy: 0.4838 +[2026-01-29T21:46:23.886877Z] Loop 1038: Loss: 8.21e-03, Avg Return: 0.352, Regret: 0.4445, Entropy: 0.4623 +[2026-01-29T21:46:25.048022Z] Loop 1039: Loss: 9.48e-03, Avg Return: 0.347, Regret: 0.4445, Entropy: 0.4490 +[2026-01-29T21:46:26.255266Z] Loop 1040: Loss: 9.34e-03, Avg Return: 0.352, Regret: 0.4497, Entropy: 0.4563 +[2026-01-29T21:46:27.415999Z] Loop 1041: Loss: 7.50e-03, Avg Return: 0.360, Regret: 0.4497, Entropy: 0.4736 +[2026-01-29T21:46:28.575167Z] Loop 1042: Loss: 7.48e-03, Avg Return: 0.358, Regret: 0.4497, Entropy: 0.4733 +[2026-01-29T21:46:29.737150Z] Loop 1043: Loss: 7.88e-03, Avg Return: 0.366, Regret: 0.4497, Entropy: 0.4600 +[2026-01-29T21:46:30.897486Z] Loop 1044: Loss: 7.78e-03, Avg Return: 0.367, Regret: 0.4497, Entropy: 0.3985 +[2026-01-29T21:46:32.102294Z] Loop 1045: Loss: 8.29e-03, Avg Return: 0.352, Regret: 0.4504, Entropy: 0.3460 +[2026-01-29T21:46:33.262090Z] Loop 1046: Loss: 8.60e-03, Avg Return: 0.344, Regret: 0.4504, Entropy: 0.3236 +[2026-01-29T21:46:34.423112Z] Loop 1047: Loss: 8.86e-03, Avg Return: 0.354, Regret: 0.4504, Entropy: 0.3405 +[2026-01-29T21:46:35.585567Z] Loop 1048: Loss: 7.13e-03, Avg Return: 0.359, Regret: 0.4504, Entropy: 0.3799 +[2026-01-29T21:46:36.751189Z] Loop 1049: Loss: 7.11e-03, Avg Return: 0.367, Regret: 0.4504, Entropy: 0.4313 +[2026-01-29T21:46:37.960502Z] Loop 1050: Loss: 7.04e-03, Avg Return: 0.363, Regret: 0.4400, Entropy: 0.4565 +[2026-01-29T21:46:39.121072Z] Loop 1051: Loss: 7.11e-03, Avg Return: 0.364, Regret: 0.4400, Entropy: 0.4459 +[2026-01-29T21:46:40.280564Z] Loop 1052: Loss: 7.56e-03, Avg Return: 0.356, Regret: 0.4400, Entropy: 0.4213 +[2026-01-29T21:46:41.440846Z] Loop 1053: Loss: 7.56e-03, Avg Return: 0.357, Regret: 0.4400, Entropy: 0.4267 +[2026-01-29T21:46:42.602339Z] Loop 1054: Loss: 7.11e-03, Avg Return: 0.360, Regret: 0.4400, Entropy: 0.4315 +[2026-01-29T21:46:43.818117Z] Loop 1055: Loss: 6.72e-03, Avg Return: 0.368, Regret: 0.4400, Entropy: 0.4479 +[2026-01-29T21:46:44.980253Z] Loop 1056: Loss: 6.57e-03, Avg Return: 0.367, Regret: 0.4400, Entropy: 0.4423 +[2026-01-29T21:46:46.142828Z] Loop 1057: Loss: 6.49e-03, Avg Return: 0.368, Regret: 0.4400, Entropy: 0.4074 +[2026-01-29T21:46:47.304228Z] Loop 1058: Loss: 6.62e-03, Avg Return: 0.362, Regret: 0.4400, Entropy: 0.3674 +[2026-01-29T21:46:48.463519Z] Loop 1059: Loss: 6.64e-03, Avg Return: 0.362, Regret: 0.4400, Entropy: 0.3334 +[2026-01-29T21:46:49.668701Z] Loop 1060: Loss: 7.82e-03, Avg Return: 0.355, Regret: 0.4467, Entropy: 0.3108 +[2026-01-29T21:46:50.828310Z] Loop 1061: Loss: 7.22e-03, Avg Return: 0.356, Regret: 0.4467, Entropy: 0.2992 +[2026-01-29T21:46:51.989655Z] Loop 1062: Loss: 7.35e-03, Avg Return: 0.363, Regret: 0.4467, Entropy: 0.3088 +[2026-01-29T21:46:53.149392Z] Loop 1063: Loss: 6.77e-03, Avg Return: 0.360, Regret: 0.4467, Entropy: 0.3251 +[2026-01-29T21:46:54.309345Z] Loop 1064: Loss: 6.41e-03, Avg Return: 0.358, Regret: 0.4467, Entropy: 0.3419 +[2026-01-29T21:46:55.514708Z] Loop 1065: Loss: 5.96e-03, Avg Return: 0.370, Regret: 0.4359, Entropy: 0.3751 +[2026-01-29T21:46:56.676300Z] Loop 1066: Loss: 6.03e-03, Avg Return: 0.365, Regret: 0.4359, Entropy: 0.3995 +[2026-01-29T21:46:57.840593Z] Loop 1067: Loss: 6.68e-03, Avg Return: 0.371, Regret: 0.4359, Entropy: 0.4054 +[2026-01-29T21:46:59.002899Z] Loop 1068: Loss: 5.75e-03, Avg Return: 0.374, Regret: 0.4359, Entropy: 0.4279 +[2026-01-29T21:47:00.163419Z] Loop 1069: Loss: 6.80e-03, Avg Return: 0.372, Regret: 0.4359, Entropy: 0.4039 +[2026-01-29T21:47:01.379829Z] Loop 1070: Loss: 6.20e-03, Avg Return: 0.363, Regret: 0.4361, Entropy: 0.4023 +[2026-01-29T21:47:02.542847Z] Loop 1071: Loss: 5.73e-03, Avg Return: 0.367, Regret: 0.4361, Entropy: 0.3987 +[2026-01-29T21:47:03.702161Z] Loop 1072: Loss: 6.89e-03, Avg Return: 0.370, Regret: 0.4361, Entropy: 0.3703 +[2026-01-29T21:47:04.863146Z] Loop 1073: Loss: 5.89e-03, Avg Return: 0.365, Regret: 0.4361, Entropy: 0.3683 +[2026-01-29T21:47:06.022873Z] Loop 1074: Loss: 6.42e-03, Avg Return: 0.367, Regret: 0.4361, Entropy: 0.3751 +[2026-01-29T21:47:07.230097Z] Loop 1075: Loss: 6.19e-03, Avg Return: 0.368, Regret: 0.4345, Entropy: 0.3910 +[2026-01-29T21:47:08.390708Z] Loop 1076: Loss: 6.04e-03, Avg Return: 0.370, Regret: 0.4345, Entropy: 0.4165 +[2026-01-29T21:47:09.552191Z] Loop 1077: Loss: 6.04e-03, Avg Return: 0.366, Regret: 0.4345, Entropy: 0.4090 +[2026-01-29T21:47:10.712160Z] Loop 1078: Loss: 5.87e-03, Avg Return: 0.371, Regret: 0.4345, Entropy: 0.4002 +[2026-01-29T21:47:11.873242Z] Loop 1079: Loss: 5.26e-03, Avg Return: 0.374, Regret: 0.4345, Entropy: 0.3836 +[2026-01-29T21:47:13.082176Z] Loop 1080: Loss: 5.32e-03, Avg Return: 0.369, Regret: 0.4315, Entropy: 0.3520 +[2026-01-29T21:47:14.245351Z] Loop 1081: Loss: 5.77e-03, Avg Return: 0.369, Regret: 0.4315, Entropy: 0.3151 +[2026-01-29T21:47:15.407233Z] Loop 1082: Loss: 5.75e-03, Avg Return: 0.374, Regret: 0.4315, Entropy: 0.2870 +[2026-01-29T21:47:16.568715Z] Loop 1083: Loss: 5.49e-03, Avg Return: 0.364, Regret: 0.4315, Entropy: 0.2752 +[2026-01-29T21:47:17.729242Z] Loop 1084: Loss: 5.23e-03, Avg Return: 0.369, Regret: 0.4315, Entropy: 0.2477 +[2026-01-29T21:47:18.940907Z] Loop 1085: Loss: 5.73e-03, Avg Return: 0.366, Regret: 0.4372, Entropy: 0.2411 +[2026-01-29T21:47:20.101391Z] Loop 1086: Loss: 5.40e-03, Avg Return: 0.366, Regret: 0.4372, Entropy: 0.2710 +[2026-01-29T21:47:21.261247Z] Loop 1087: Loss: 5.36e-03, Avg Return: 0.379, Regret: 0.4372, Entropy: 0.3046 +[2026-01-29T21:47:22.424038Z] Loop 1088: Loss: 5.59e-03, Avg Return: 0.374, Regret: 0.4372, Entropy: 0.3026 +[2026-01-29T21:47:23.583522Z] Loop 1089: Loss: 5.18e-03, Avg Return: 0.374, Regret: 0.4372, Entropy: 0.2969 +[2026-01-29T21:47:24.788490Z] Loop 1090: Loss: 5.15e-03, Avg Return: 0.369, Regret: 0.4297, Entropy: 0.3111 +[2026-01-29T21:47:25.949674Z] Loop 1091: Loss: 5.23e-03, Avg Return: 0.380, Regret: 0.4297, Entropy: 0.3290 +[2026-01-29T21:47:27.113457Z] Loop 1092: Loss: 5.36e-03, Avg Return: 0.380, Regret: 0.4297, Entropy: 0.3583 +[2026-01-29T21:47:28.272461Z] Loop 1093: Loss: 5.45e-03, Avg Return: 0.383, Regret: 0.4297, Entropy: 0.3693 +[2026-01-29T21:47:29.434403Z] Loop 1094: Loss: 5.17e-03, Avg Return: 0.372, Regret: 0.4297, Entropy: 0.3813 +[2026-01-29T21:47:30.643822Z] Loop 1095: Loss: 5.98e-03, Avg Return: 0.385, Regret: 0.4274, Entropy: 0.3817 +[2026-01-29T21:47:31.804483Z] Loop 1096: Loss: 5.18e-03, Avg Return: 0.377, Regret: 0.4274, Entropy: 0.3714 +[2026-01-29T21:47:32.964878Z] Loop 1097: Loss: 5.11e-03, Avg Return: 0.375, Regret: 0.4274, Entropy: 0.3662 +[2026-01-29T21:47:34.127533Z] Loop 1098: Loss: 5.06e-03, Avg Return: 0.381, Regret: 0.4274, Entropy: 0.3708 +[2026-01-29T21:47:35.290883Z] Loop 1099: Loss: 5.22e-03, Avg Return: 0.376, Regret: 0.4274, Entropy: 0.3810 +[2026-01-29T21:47:36.494490Z] Loop 1100: Loss: 5.86e-03, Avg Return: 0.378, Regret: 0.4258, Entropy: 0.3806 +[2026-01-29T21:47:37.652958Z] Loop 1101: Loss: 4.92e-03, Avg Return: 0.369, Regret: 0.4258, Entropy: 0.3770 +[2026-01-29T21:47:38.812866Z] Loop 1102: Loss: 5.38e-03, Avg Return: 0.374, Regret: 0.4258, Entropy: 0.3240 +[2026-01-29T21:47:39.971848Z] Loop 1103: Loss: 4.75e-03, Avg Return: 0.375, Regret: 0.4258, Entropy: 0.2809 +[2026-01-29T21:47:41.131644Z] Loop 1104: Loss: 4.73e-03, Avg Return: 0.375, Regret: 0.4258, Entropy: 0.2522 +[2026-01-29T21:47:42.334441Z] Loop 1105: Loss: 4.83e-03, Avg Return: 0.377, Regret: 0.4286, Entropy: 0.2476 +[2026-01-29T21:47:43.493692Z] Loop 1106: Loss: 4.86e-03, Avg Return: 0.378, Regret: 0.4286, Entropy: 0.2645 +[2026-01-29T21:47:44.653161Z] Loop 1107: Loss: 4.58e-03, Avg Return: 0.377, Regret: 0.4286, Entropy: 0.3244 +[2026-01-29T21:47:45.813002Z] Loop 1108: Loss: 5.24e-03, Avg Return: 0.374, Regret: 0.4286, Entropy: 0.3633 +[2026-01-29T21:47:46.971608Z] Loop 1109: Loss: 5.25e-03, Avg Return: 0.382, Regret: 0.4286, Entropy: 0.3357 +[2026-01-29T21:47:48.174976Z] Loop 1110: Loss: 5.03e-03, Avg Return: 0.379, Regret: 0.4260, Entropy: 0.2861 +[2026-01-29T21:47:49.336076Z] Loop 1111: Loss: 4.57e-03, Avg Return: 0.376, Regret: 0.4260, Entropy: 0.3016 +[2026-01-29T21:47:50.496696Z] Loop 1112: Loss: 5.04e-03, Avg Return: 0.378, Regret: 0.4260, Entropy: 0.3263 +[2026-01-29T21:47:51.655739Z] Loop 1113: Loss: 5.14e-03, Avg Return: 0.381, Regret: 0.4260, Entropy: 0.3494 +[2026-01-29T21:47:52.815836Z] Loop 1114: Loss: 5.59e-03, Avg Return: 0.383, Regret: 0.4260, Entropy: 0.3541 +[2026-01-29T21:47:54.022641Z] Loop 1115: Loss: 5.51e-03, Avg Return: 0.385, Regret: 0.4220, Entropy: 0.3464 +[2026-01-29T21:47:55.187996Z] Loop 1116: Loss: 5.18e-03, Avg Return: 0.379, Regret: 0.4220, Entropy: 0.3231 +[2026-01-29T21:47:56.348367Z] Loop 1117: Loss: 4.63e-03, Avg Return: 0.379, Regret: 0.4220, Entropy: 0.3085 +[2026-01-29T21:47:57.513022Z] Loop 1118: Loss: 4.93e-03, Avg Return: 0.390, Regret: 0.4220, Entropy: 0.2946 +[2026-01-29T21:47:58.673888Z] Loop 1119: Loss: 4.68e-03, Avg Return: 0.386, Regret: 0.4220, Entropy: 0.2789 +[2026-01-29T21:47:59.876797Z] Loop 1120: Loss: 4.33e-03, Avg Return: 0.379, Regret: 0.4233, Entropy: 0.2576 +[2026-01-29T21:48:01.038596Z] Loop 1121: Loss: 4.44e-03, Avg Return: 0.374, Regret: 0.4233, Entropy: 0.2493 +[2026-01-29T21:48:02.198387Z] Loop 1122: Loss: 4.48e-03, Avg Return: 0.381, Regret: 0.4233, Entropy: 0.2544 +[2026-01-29T21:48:03.358717Z] Loop 1123: Loss: 4.38e-03, Avg Return: 0.375, Regret: 0.4233, Entropy: 0.2581 +[2026-01-29T21:48:04.518404Z] Loop 1124: Loss: 4.52e-03, Avg Return: 0.378, Regret: 0.4233, Entropy: 0.2598 +[2026-01-29T21:48:05.726261Z] Loop 1125: Loss: 4.32e-03, Avg Return: 0.378, Regret: 0.4219, Entropy: 0.2579 +[2026-01-29T21:48:06.885902Z] Loop 1126: Loss: 4.52e-03, Avg Return: 0.378, Regret: 0.4219, Entropy: 0.2720 +[2026-01-29T21:48:08.050960Z] Loop 1127: Loss: 4.64e-03, Avg Return: 0.380, Regret: 0.4219, Entropy: 0.3017 +[2026-01-29T21:48:09.211430Z] Loop 1128: Loss: 4.24e-03, Avg Return: 0.394, Regret: 0.4219, Entropy: 0.3248 +[2026-01-29T21:48:10.374178Z] Loop 1129: Loss: 5.60e-03, Avg Return: 0.389, Regret: 0.4219, Entropy: 0.3345 +[2026-01-29T21:48:11.584779Z] Loop 1130: Loss: 4.90e-03, Avg Return: 0.390, Regret: 0.4170, Entropy: 0.3510 +[2026-01-29T21:48:12.744154Z] Loop 1131: Loss: 4.90e-03, Avg Return: 0.378, Regret: 0.4170, Entropy: 0.3497 +[2026-01-29T21:48:13.902719Z] Loop 1132: Loss: 4.64e-03, Avg Return: 0.383, Regret: 0.4170, Entropy: 0.3568 +[2026-01-29T21:48:15.062031Z] Loop 1133: Loss: 5.27e-03, Avg Return: 0.390, Regret: 0.4170, Entropy: 0.3312 +[2026-01-29T21:48:16.221461Z] Loop 1134: Loss: 4.88e-03, Avg Return: 0.390, Regret: 0.4170, Entropy: 0.3111 +[2026-01-29T21:48:17.426497Z] Loop 1135: Loss: 4.80e-03, Avg Return: 0.391, Regret: 0.4156, Entropy: 0.3246 +[2026-01-29T21:48:18.585553Z] Loop 1136: Loss: 5.00e-03, Avg Return: 0.386, Regret: 0.4156, Entropy: 0.3225 +[2026-01-29T21:48:19.744464Z] Loop 1137: Loss: 5.44e-03, Avg Return: 0.395, Regret: 0.4156, Entropy: 0.3363 +[2026-01-29T21:48:20.903395Z] Loop 1138: Loss: 5.23e-03, Avg Return: 0.388, Regret: 0.4156, Entropy: 0.3482 +[2026-01-29T21:48:22.062934Z] Loop 1139: Loss: 5.20e-03, Avg Return: 0.379, Regret: 0.4156, Entropy: 0.3514 +[2026-01-29T21:48:23.267141Z] Loop 1140: Loss: 5.58e-03, Avg Return: 0.392, Regret: 0.4132, Entropy: 0.3414 +[2026-01-29T21:48:24.427180Z] Loop 1141: Loss: 5.21e-03, Avg Return: 0.392, Regret: 0.4132, Entropy: 0.3292 +[2026-01-29T21:48:25.586383Z] Loop 1142: Loss: 5.79e-03, Avg Return: 0.388, Regret: 0.4132, Entropy: 0.3025 +[2026-01-29T21:48:26.747125Z] Loop 1143: Loss: 5.90e-03, Avg Return: 0.396, Regret: 0.4132, Entropy: 0.3005 +[2026-01-29T21:48:27.907913Z] Loop 1144: Loss: 5.73e-03, Avg Return: 0.398, Regret: 0.4132, Entropy: 0.3191 +[2026-01-29T21:48:29.113568Z] Loop 1145: Loss: 5.56e-03, Avg Return: 0.392, Regret: 0.4118, Entropy: 0.3361 +[2026-01-29T21:48:30.272959Z] Loop 1146: Loss: 5.45e-03, Avg Return: 0.391, Regret: 0.4118, Entropy: 0.3543 +[2026-01-29T21:48:31.432992Z] Loop 1147: Loss: 5.21e-03, Avg Return: 0.390, Regret: 0.4118, Entropy: 0.3435 +[2026-01-29T21:48:32.592750Z] Loop 1148: Loss: 5.92e-03, Avg Return: 0.391, Regret: 0.4118, Entropy: 0.3306 +[2026-01-29T21:48:33.753259Z] Loop 1149: Loss: 5.64e-03, Avg Return: 0.393, Regret: 0.4118, Entropy: 0.3255 +[2026-01-29T21:48:34.959049Z] Loop 1150: Loss: 5.63e-03, Avg Return: 0.396, Regret: 0.4083, Entropy: 0.3254 +[2026-01-29T21:48:36.121277Z] Loop 1151: Loss: 5.28e-03, Avg Return: 0.395, Regret: 0.4083, Entropy: 0.3164 +[2026-01-29T21:48:37.281520Z] Loop 1152: Loss: 4.99e-03, Avg Return: 0.389, Regret: 0.4083, Entropy: 0.3097 +[2026-01-29T21:48:38.444633Z] Loop 1153: Loss: 5.39e-03, Avg Return: 0.401, Regret: 0.4083, Entropy: 0.3091 +[2026-01-29T21:48:39.604852Z] Loop 1154: Loss: 5.13e-03, Avg Return: 0.395, Regret: 0.4083, Entropy: 0.3010 +[2026-01-29T21:48:40.809816Z] Loop 1155: Loss: 5.54e-03, Avg Return: 0.396, Regret: 0.4062, Entropy: 0.3189 +[2026-01-29T21:48:41.971284Z] Loop 1156: Loss: 5.50e-03, Avg Return: 0.399, Regret: 0.4062, Entropy: 0.3332 +[2026-01-29T21:48:43.133685Z] Loop 1157: Loss: 5.85e-03, Avg Return: 0.407, Regret: 0.4062, Entropy: 0.3378 +[2026-01-29T21:48:44.295262Z] Loop 1158: Loss: 5.25e-03, Avg Return: 0.396, Regret: 0.4062, Entropy: 0.3350 +[2026-01-29T21:48:45.454981Z] Loop 1159: Loss: 5.83e-03, Avg Return: 0.398, Regret: 0.4062, Entropy: 0.3267 +[2026-01-29T21:48:46.662967Z] Loop 1160: Loss: 5.33e-03, Avg Return: 0.396, Regret: 0.4037, Entropy: 0.3244 +[2026-01-29T21:48:47.823167Z] Loop 1161: Loss: 5.38e-03, Avg Return: 0.402, Regret: 0.4037, Entropy: 0.3300 +[2026-01-29T21:48:48.983212Z] Loop 1162: Loss: 5.61e-03, Avg Return: 0.406, Regret: 0.4037, Entropy: 0.3223 +[2026-01-29T21:48:50.143239Z] Loop 1163: Loss: 5.50e-03, Avg Return: 0.404, Regret: 0.4037, Entropy: 0.3235 +[2026-01-29T21:48:51.303549Z] Loop 1164: Loss: 5.43e-03, Avg Return: 0.393, Regret: 0.4037, Entropy: 0.3170 +[2026-01-29T21:48:52.508000Z] Loop 1165: Loss: 5.82e-03, Avg Return: 0.403, Regret: 0.4009, Entropy: 0.3247 +[2026-01-29T21:48:53.669289Z] Loop 1166: Loss: 5.34e-03, Avg Return: 0.408, Regret: 0.4009, Entropy: 0.3236 +[2026-01-29T21:48:54.828698Z] Loop 1167: Loss: 4.97e-03, Avg Return: 0.399, Regret: 0.4009, Entropy: 0.3287 +[2026-01-29T21:48:55.989813Z] Loop 1168: Loss: 5.86e-03, Avg Return: 0.403, Regret: 0.4009, Entropy: 0.3003 +[2026-01-29T21:48:57.148375Z] Loop 1169: Loss: 5.36e-03, Avg Return: 0.409, Regret: 0.4009, Entropy: 0.2964 +[2026-01-29T21:48:58.350121Z] Loop 1170: Loss: 5.18e-03, Avg Return: 0.396, Regret: 0.4025, Entropy: 0.2932 +[2026-01-29T21:48:59.508400Z] Loop 1171: Loss: 5.35e-03, Avg Return: 0.400, Regret: 0.4025, Entropy: 0.3024 +[2026-01-29T21:49:00.667066Z] Loop 1172: Loss: 5.47e-03, Avg Return: 0.401, Regret: 0.4025, Entropy: 0.3224 +[2026-01-29T21:49:01.826559Z] Loop 1173: Loss: 5.43e-03, Avg Return: 0.415, Regret: 0.4025, Entropy: 0.3111 +[2026-01-29T21:49:02.986747Z] Loop 1174: Loss: 5.78e-03, Avg Return: 0.403, Regret: 0.4025, Entropy: 0.3016 +[2026-01-29T21:49:04.190823Z] Loop 1175: Loss: 5.79e-03, Avg Return: 0.406, Regret: 0.3981, Entropy: 0.2890 +[2026-01-29T21:49:05.350786Z] Loop 1176: Loss: 5.88e-03, Avg Return: 0.408, Regret: 0.3981, Entropy: 0.2951 +[2026-01-29T21:49:06.509271Z] Loop 1177: Loss: 5.35e-03, Avg Return: 0.413, Regret: 0.3981, Entropy: 0.3025 +[2026-01-29T21:49:07.667208Z] Loop 1178: Loss: 5.87e-03, Avg Return: 0.413, Regret: 0.3981, Entropy: 0.3154 +[2026-01-29T21:49:08.826560Z] Loop 1179: Loss: 5.65e-03, Avg Return: 0.415, Regret: 0.3981, Entropy: 0.3058 +[2026-01-29T21:49:10.029891Z] Loop 1180: Loss: 5.45e-03, Avg Return: 0.403, Regret: 0.3968, Entropy: 0.2921 +[2026-01-29T21:49:11.189448Z] Loop 1181: Loss: 5.12e-03, Avg Return: 0.394, Regret: 0.3968, Entropy: 0.2823 +[2026-01-29T21:49:12.348396Z] Loop 1182: Loss: 5.18e-03, Avg Return: 0.404, Regret: 0.3968, Entropy: 0.2776 +[2026-01-29T21:49:13.507445Z] Loop 1183: Loss: 5.30e-03, Avg Return: 0.409, Regret: 0.3968, Entropy: 0.2937 +[2026-01-29T21:49:14.668182Z] Loop 1184: Loss: 4.97e-03, Avg Return: 0.406, Regret: 0.3968, Entropy: 0.3184 +[2026-01-29T21:49:15.873277Z] Loop 1185: Loss: 5.84e-03, Avg Return: 0.418, Regret: 0.3897, Entropy: 0.3231 +[2026-01-29T21:49:17.031900Z] Loop 1186: Loss: 6.65e-03, Avg Return: 0.410, Regret: 0.3897, Entropy: 0.2895 +[2026-01-29T21:49:18.191330Z] Loop 1187: Loss: 6.32e-03, Avg Return: 0.406, Regret: 0.3897, Entropy: 0.2822 +[2026-01-29T21:49:19.350396Z] Loop 1188: Loss: 6.27e-03, Avg Return: 0.392, Regret: 0.3897, Entropy: 0.2479 +[2026-01-29T21:49:20.509341Z] Loop 1189: Loss: 6.67e-03, Avg Return: 0.402, Regret: 0.3897, Entropy: 0.2392 +[2026-01-29T21:49:21.715723Z] Loop 1190: Loss: 6.15e-03, Avg Return: 0.390, Regret: 0.4087, Entropy: 0.2362 +[2026-01-29T21:49:22.875929Z] Loop 1191: Loss: 6.67e-03, Avg Return: 0.402, Regret: 0.4087, Entropy: 0.2472 +[2026-01-29T21:49:24.034726Z] Loop 1192: Loss: 6.22e-03, Avg Return: 0.409, Regret: 0.4087, Entropy: 0.2697 +[2026-01-29T21:49:25.194648Z] Loop 1193: Loss: 6.83e-03, Avg Return: 0.421, Regret: 0.4087, Entropy: 0.3078 +[2026-01-29T21:49:26.355764Z] Loop 1194: Loss: 5.90e-03, Avg Return: 0.415, Regret: 0.4087, Entropy: 0.3171 +[2026-01-29T21:49:27.561357Z] Loop 1195: Loss: 5.20e-03, Avg Return: 0.413, Regret: 0.3916, Entropy: 0.3009 +[2026-01-29T21:49:28.721418Z] Loop 1196: Loss: 5.04e-03, Avg Return: 0.410, Regret: 0.3916, Entropy: 0.2790 +[2026-01-29T21:49:29.881890Z] Loop 1197: Loss: 5.11e-03, Avg Return: 0.410, Regret: 0.3916, Entropy: 0.2889 +[2026-01-29T21:49:31.044060Z] Loop 1198: Loss: 5.12e-03, Avg Return: 0.416, Regret: 0.3916, Entropy: 0.2934 +[2026-01-29T21:49:32.203025Z] Loop 1199: Loss: 5.81e-03, Avg Return: 0.424, Regret: 0.3916, Entropy: 0.2998 +[2026-01-29T21:49:33.404841Z] Loop 1200: Loss: 6.20e-03, Avg Return: 0.418, Regret: 0.3852, Entropy: 0.3106 +[2026-01-29T21:49:34.564713Z] Loop 1201: Loss: 5.90e-03, Avg Return: 0.416, Regret: 0.3852, Entropy: 0.3072 +[2026-01-29T21:49:35.723984Z] Loop 1202: Loss: 5.85e-03, Avg Return: 0.424, Regret: 0.3852, Entropy: 0.3005 +[2026-01-29T21:49:36.883250Z] Loop 1203: Loss: 5.91e-03, Avg Return: 0.416, Regret: 0.3852, Entropy: 0.3071 +[2026-01-29T21:49:38.044006Z] Loop 1204: Loss: 6.75e-03, Avg Return: 0.428, Regret: 0.3852, Entropy: 0.3033 +[2026-01-29T21:49:39.248270Z] Loop 1205: Loss: 6.43e-03, Avg Return: 0.423, Regret: 0.3816, Entropy: 0.2896 +[2026-01-29T21:49:40.410208Z] Loop 1206: Loss: 6.48e-03, Avg Return: 0.418, Regret: 0.3816, Entropy: 0.2665 +[2026-01-29T21:49:41.572749Z] Loop 1207: Loss: 6.14e-03, Avg Return: 0.411, Regret: 0.3816, Entropy: 0.2599 +[2026-01-29T21:49:42.733384Z] Loop 1208: Loss: 7.12e-03, Avg Return: 0.425, Regret: 0.3816, Entropy: 0.2646 +[2026-01-29T21:49:43.892828Z] Loop 1209: Loss: 6.92e-03, Avg Return: 0.413, Regret: 0.3816, Entropy: 0.2622 +[2026-01-29T21:49:45.104426Z] Loop 1210: Loss: 6.00e-03, Avg Return: 0.420, Regret: 0.3830, Entropy: 0.2692 +[2026-01-29T21:49:46.266799Z] Loop 1211: Loss: 6.65e-03, Avg Return: 0.425, Regret: 0.3830, Entropy: 0.2763 +[2026-01-29T21:49:47.426809Z] Loop 1212: Loss: 7.31e-03, Avg Return: 0.428, Regret: 0.3830, Entropy: 0.2851 +[2026-01-29T21:49:48.586054Z] Loop 1213: Loss: 6.86e-03, Avg Return: 0.424, Regret: 0.3830, Entropy: 0.2832 +[2026-01-29T21:49:49.746205Z] Loop 1214: Loss: 6.35e-03, Avg Return: 0.433, Regret: 0.3830, Entropy: 0.2794 +[2026-01-29T21:49:50.952592Z] Loop 1215: Loss: 6.65e-03, Avg Return: 0.428, Regret: 0.3773, Entropy: 0.2841 +[2026-01-29T21:49:52.115011Z] Loop 1216: Loss: 6.23e-03, Avg Return: 0.420, Regret: 0.3773, Entropy: 0.2940 +[2026-01-29T21:49:53.275421Z] Loop 1217: Loss: 6.84e-03, Avg Return: 0.425, Regret: 0.3773, Entropy: 0.2850 +[2026-01-29T21:49:54.436135Z] Loop 1218: Loss: 6.43e-03, Avg Return: 0.427, Regret: 0.3773, Entropy: 0.2861 +[2026-01-29T21:49:55.596217Z] Loop 1219: Loss: 7.08e-03, Avg Return: 0.432, Regret: 0.3773, Entropy: 0.2803 +[2026-01-29T21:49:56.802546Z] Loop 1220: Loss: 6.44e-03, Avg Return: 0.425, Regret: 0.3752, Entropy: 0.2957 +[2026-01-29T21:49:57.962261Z] Loop 1221: Loss: 6.68e-03, Avg Return: 0.434, Regret: 0.3752, Entropy: 0.2880 +[2026-01-29T21:49:59.122305Z] Loop 1222: Loss: 6.07e-03, Avg Return: 0.431, Regret: 0.3752, Entropy: 0.2808 +[2026-01-29T21:50:00.283538Z] Loop 1223: Loss: 5.27e-03, Avg Return: 0.419, Regret: 0.3752, Entropy: 0.2731 +[2026-01-29T21:50:01.443169Z] Loop 1224: Loss: 5.80e-03, Avg Return: 0.422, Regret: 0.3752, Entropy: 0.2680 +[2026-01-29T21:50:02.650812Z] Loop 1225: Loss: 4.93e-03, Avg Return: 0.417, Regret: 0.3816, Entropy: 0.2705 +[2026-01-29T21:50:03.815474Z] Loop 1226: Loss: 5.70e-03, Avg Return: 0.429, Regret: 0.3816, Entropy: 0.2705 +[2026-01-29T21:50:04.974186Z] Loop 1227: Loss: 6.83e-03, Avg Return: 0.432, Regret: 0.3816, Entropy: 0.2843 +[2026-01-29T21:50:06.133043Z] Loop 1228: Loss: 6.07e-03, Avg Return: 0.432, Regret: 0.3816, Entropy: 0.2929 +[2026-01-29T21:50:07.294657Z] Loop 1229: Loss: 6.63e-03, Avg Return: 0.431, Regret: 0.3816, Entropy: 0.2779 +[2026-01-29T21:50:08.500768Z] Loop 1230: Loss: 6.86e-03, Avg Return: 0.428, Regret: 0.3762, Entropy: 0.2527 +[2026-01-29T21:50:09.663453Z] Loop 1231: Loss: 6.58e-03, Avg Return: 0.424, Regret: 0.3762, Entropy: 0.2462 +[2026-01-29T21:50:10.823295Z] Loop 1232: Loss: 6.65e-03, Avg Return: 0.426, Regret: 0.3762, Entropy: 0.2422 +[2026-01-29T21:50:11.985095Z] Loop 1233: Loss: 6.40e-03, Avg Return: 0.419, Regret: 0.3762, Entropy: 0.2368 +[2026-01-29T21:50:13.147959Z] Loop 1234: Loss: 7.12e-03, Avg Return: 0.427, Regret: 0.3762, Entropy: 0.2526 +[2026-01-29T21:50:14.353525Z] Loop 1235: Loss: 6.55e-03, Avg Return: 0.439, Regret: 0.3723, Entropy: 0.2682 +[2026-01-29T21:50:15.512770Z] Loop 1236: Loss: 6.19e-03, Avg Return: 0.431, Regret: 0.3723, Entropy: 0.2743 +[2026-01-29T21:50:16.674556Z] Loop 1237: Loss: 5.62e-03, Avg Return: 0.432, Regret: 0.3723, Entropy: 0.2538 +[2026-01-29T21:50:17.835440Z] Loop 1238: Loss: 4.68e-03, Avg Return: 0.426, Regret: 0.3723, Entropy: 0.2585 +[2026-01-29T21:50:18.995843Z] Loop 1239: Loss: 5.25e-03, Avg Return: 0.433, Regret: 0.3723, Entropy: 0.2461 +[2026-01-29T21:50:20.202693Z] Loop 1240: Loss: 4.95e-03, Avg Return: 0.428, Regret: 0.3749, Entropy: 0.2527 +[2026-01-29T21:50:21.363529Z] Loop 1241: Loss: 5.53e-03, Avg Return: 0.436, Regret: 0.3749, Entropy: 0.2543 +[2026-01-29T21:50:22.524065Z] Loop 1242: Loss: 5.30e-03, Avg Return: 0.425, Regret: 0.3749, Entropy: 0.2553 +[2026-01-29T21:50:23.684850Z] Loop 1243: Loss: 5.09e-03, Avg Return: 0.430, Regret: 0.3749, Entropy: 0.2542 +[2026-01-29T21:50:24.844661Z] Loop 1244: Loss: 5.39e-03, Avg Return: 0.428, Regret: 0.3749, Entropy: 0.2641 +[2026-01-29T21:50:26.050425Z] Loop 1245: Loss: 6.56e-03, Avg Return: 0.441, Regret: 0.3708, Entropy: 0.2582 +[2026-01-29T21:50:27.209276Z] Loop 1246: Loss: 6.05e-03, Avg Return: 0.434, Regret: 0.3708, Entropy: 0.2657 +[2026-01-29T21:50:28.368639Z] Loop 1247: Loss: 5.74e-03, Avg Return: 0.429, Regret: 0.3708, Entropy: 0.2553 +[2026-01-29T21:50:29.527396Z] Loop 1248: Loss: 6.69e-03, Avg Return: 0.435, Regret: 0.3708, Entropy: 0.2559 +[2026-01-29T21:50:30.686924Z] Loop 1249: Loss: 6.10e-03, Avg Return: 0.428, Regret: 0.3708, Entropy: 0.2554 +[2026-01-29T21:50:31.891904Z] Loop 1250: Loss: 6.47e-03, Avg Return: 0.430, Regret: 0.3709, Entropy: 0.2528 +[2026-01-29T21:50:33.052391Z] Loop 1251: Loss: 6.23e-03, Avg Return: 0.439, Regret: 0.3709, Entropy: 0.2507 +[2026-01-29T21:50:34.212081Z] Loop 1252: Loss: 6.23e-03, Avg Return: 0.435, Regret: 0.3709, Entropy: 0.2500 +[2026-01-29T21:50:35.373422Z] Loop 1253: Loss: 6.10e-03, Avg Return: 0.432, Regret: 0.3709, Entropy: 0.2537 +[2026-01-29T21:50:36.533880Z] Loop 1254: Loss: 6.15e-03, Avg Return: 0.437, Regret: 0.3709, Entropy: 0.2564 +[2026-01-29T21:50:37.739423Z] Loop 1255: Loss: 5.36e-03, Avg Return: 0.441, Regret: 0.3698, Entropy: 0.2578 +[2026-01-29T21:50:38.898195Z] Loop 1256: Loss: 5.56e-03, Avg Return: 0.430, Regret: 0.3698, Entropy: 0.2537 +[2026-01-29T21:50:40.058686Z] Loop 1257: Loss: 5.23e-03, Avg Return: 0.433, Regret: 0.3698, Entropy: 0.2541 +[2026-01-29T21:50:41.218839Z] Loop 1258: Loss: 5.52e-03, Avg Return: 0.441, Regret: 0.3698, Entropy: 0.2623 +[2026-01-29T21:50:42.378641Z] Loop 1259: Loss: 5.88e-03, Avg Return: 0.434, Regret: 0.3698, Entropy: 0.2577 +[2026-01-29T21:50:43.588249Z] Loop 1260: Loss: 5.76e-03, Avg Return: 0.439, Regret: 0.3695, Entropy: 0.2593 +[2026-01-29T21:50:44.749540Z] Loop 1261: Loss: 5.77e-03, Avg Return: 0.433, Regret: 0.3695, Entropy: 0.2635 +[2026-01-29T21:50:45.908301Z] Loop 1262: Loss: 5.72e-03, Avg Return: 0.432, Regret: 0.3695, Entropy: 0.2651 +[2026-01-29T21:50:47.067158Z] Loop 1263: Loss: 6.38e-03, Avg Return: 0.439, Regret: 0.3695, Entropy: 0.2644 +[2026-01-29T21:50:48.227117Z] Loop 1264: Loss: 5.91e-03, Avg Return: 0.435, Regret: 0.3695, Entropy: 0.2579 +[2026-01-29T21:50:49.432749Z] Loop 1265: Loss: 6.21e-03, Avg Return: 0.431, Regret: 0.3696, Entropy: 0.2575 +[2026-01-29T21:50:50.592541Z] Loop 1266: Loss: 6.25e-03, Avg Return: 0.436, Regret: 0.3696, Entropy: 0.2571 +[2026-01-29T21:50:51.752311Z] Loop 1267: Loss: 6.29e-03, Avg Return: 0.438, Regret: 0.3696, Entropy: 0.2510 +[2026-01-29T21:50:52.911074Z] Loop 1268: Loss: 6.35e-03, Avg Return: 0.430, Regret: 0.3696, Entropy: 0.2556 +[2026-01-29T21:50:54.069971Z] Loop 1269: Loss: 6.48e-03, Avg Return: 0.429, Regret: 0.3696, Entropy: 0.2421 +[2026-01-29T21:50:55.277963Z] Loop 1270: Loss: 6.56e-03, Avg Return: 0.429, Regret: 0.3760, Entropy: 0.2447 +[2026-01-29T21:50:56.437837Z] Loop 1271: Loss: 6.51e-03, Avg Return: 0.424, Regret: 0.3760, Entropy: 0.2423 +[2026-01-29T21:50:57.597224Z] Loop 1272: Loss: 6.15e-03, Avg Return: 0.420, Regret: 0.3760, Entropy: 0.2354 +[2026-01-29T21:50:58.756161Z] Loop 1273: Loss: 6.78e-03, Avg Return: 0.435, Regret: 0.3760, Entropy: 0.2462 +[2026-01-29T21:50:59.916417Z] Loop 1274: Loss: 6.27e-03, Avg Return: 0.438, Regret: 0.3760, Entropy: 0.2511 +[2026-01-29T21:51:01.122001Z] Loop 1275: Loss: 5.61e-03, Avg Return: 0.441, Regret: 0.3680, Entropy: 0.2519 +[2026-01-29T21:51:02.280829Z] Loop 1276: Loss: 4.97e-03, Avg Return: 0.436, Regret: 0.3680, Entropy: 0.2458 +[2026-01-29T21:51:03.440471Z] Loop 1277: Loss: 4.63e-03, Avg Return: 0.423, Regret: 0.3680, Entropy: 0.2349 +[2026-01-29T21:51:04.600868Z] Loop 1278: Loss: 4.60e-03, Avg Return: 0.428, Regret: 0.3680, Entropy: 0.2078 +[2026-01-29T21:51:05.760387Z] Loop 1279: Loss: 3.70e-03, Avg Return: 0.423, Regret: 0.3680, Entropy: 0.2068 +[2026-01-29T21:51:06.967156Z] Loop 1280: Loss: 4.05e-03, Avg Return: 0.426, Regret: 0.3772, Entropy: 0.2068 +[2026-01-29T21:51:08.128292Z] Loop 1281: Loss: 4.15e-03, Avg Return: 0.431, Regret: 0.3772, Entropy: 0.2108 +[2026-01-29T21:51:09.288998Z] Loop 1282: Loss: 4.64e-03, Avg Return: 0.433, Regret: 0.3772, Entropy: 0.2250 +[2026-01-29T21:51:10.448568Z] Loop 1283: Loss: 5.27e-03, Avg Return: 0.437, Regret: 0.3772, Entropy: 0.2413 +[2026-01-29T21:51:11.610084Z] Loop 1284: Loss: 5.09e-03, Avg Return: 0.435, Regret: 0.3772, Entropy: 0.2462 +[2026-01-29T21:51:12.817174Z] Loop 1285: Loss: 6.09e-03, Avg Return: 0.439, Regret: 0.3673, Entropy: 0.2434 +[2026-01-29T21:51:13.977109Z] Loop 1286: Loss: 5.29e-03, Avg Return: 0.430, Regret: 0.3673, Entropy: 0.2343 +[2026-01-29T21:51:15.135976Z] Loop 1287: Loss: 6.03e-03, Avg Return: 0.433, Regret: 0.3673, Entropy: 0.2292 +[2026-01-29T21:51:16.298971Z] Loop 1288: Loss: 5.73e-03, Avg Return: 0.429, Regret: 0.3673, Entropy: 0.2186 +[2026-01-29T21:51:17.476185Z] Loop 1289: Loss: 5.88e-03, Avg Return: 0.423, Regret: 0.3673, Entropy: 0.2180 +[2026-01-29T21:51:18.687702Z] Loop 1290: Loss: 6.49e-03, Avg Return: 0.427, Regret: 0.3819, Entropy: 0.2127 +[2026-01-29T21:51:19.849492Z] Loop 1291: Loss: 6.69e-03, Avg Return: 0.432, Regret: 0.3819, Entropy: 0.2146 +[2026-01-29T21:51:21.009453Z] Loop 1292: Loss: 5.73e-03, Avg Return: 0.438, Regret: 0.3819, Entropy: 0.2188 +[2026-01-29T21:51:22.171109Z] Loop 1293: Loss: 5.49e-03, Avg Return: 0.441, Regret: 0.3819, Entropy: 0.2329 +[2026-01-29T21:51:23.330999Z] Loop 1294: Loss: 4.91e-03, Avg Return: 0.432, Regret: 0.3819, Entropy: 0.2210 +[2026-01-29T21:51:24.546619Z] Loop 1295: Loss: 4.11e-03, Avg Return: 0.435, Regret: 0.3738, Entropy: 0.2026 +[2026-01-29T21:51:25.709819Z] Loop 1296: Loss: 3.69e-03, Avg Return: 0.421, Regret: 0.3738, Entropy: 0.1880 +[2026-01-29T21:51:26.870969Z] Loop 1297: Loss: 4.54e-03, Avg Return: 0.409, Regret: 0.3738, Entropy: 0.1820 +[2026-01-29T21:51:28.030262Z] Loop 1298: Loss: 4.08e-03, Avg Return: 0.424, Regret: 0.3738, Entropy: 0.1807 +[2026-01-29T21:51:29.189742Z] Loop 1299: Loss: 3.45e-03, Avg Return: 0.421, Regret: 0.3738, Entropy: 0.1937 +[2026-01-29T21:51:30.398303Z] Loop 1300: Loss: 4.09e-03, Avg Return: 0.432, Regret: 0.3746, Entropy: 0.1992 +[2026-01-29T21:51:31.559723Z] Loop 1301: Loss: 3.88e-03, Avg Return: 0.426, Regret: 0.3746, Entropy: 0.2025 +[2026-01-29T21:51:32.722524Z] Loop 1302: Loss: 4.37e-03, Avg Return: 0.433, Regret: 0.3746, Entropy: 0.2053 +[2026-01-29T21:51:33.887057Z] Loop 1303: Loss: 4.29e-03, Avg Return: 0.440, Regret: 0.3746, Entropy: 0.2149 +[2026-01-29T21:51:35.049358Z] Loop 1304: Loss: 4.55e-03, Avg Return: 0.434, Regret: 0.3746, Entropy: 0.2201 +[2026-01-29T21:51:36.259730Z] Loop 1305: Loss: 5.29e-03, Avg Return: 0.443, Regret: 0.3673, Entropy: 0.2292 +[2026-01-29T21:51:37.420790Z] Loop 1306: Loss: 5.34e-03, Avg Return: 0.432, Regret: 0.3673, Entropy: 0.2322 +[2026-01-29T21:51:38.581362Z] Loop 1307: Loss: 5.71e-03, Avg Return: 0.431, Regret: 0.3673, Entropy: 0.2216 +[2026-01-29T21:51:39.742285Z] Loop 1308: Loss: 5.52e-03, Avg Return: 0.428, Regret: 0.3673, Entropy: 0.2189 +[2026-01-29T21:51:40.903096Z] Loop 1309: Loss: 6.22e-03, Avg Return: 0.440, Regret: 0.3673, Entropy: 0.2223 +[2026-01-29T21:51:42.111982Z] Loop 1310: Loss: 6.16e-03, Avg Return: 0.437, Regret: 0.3724, Entropy: 0.2255 +[2026-01-29T21:51:43.272900Z] Loop 1311: Loss: 6.09e-03, Avg Return: 0.436, Regret: 0.3724, Entropy: 0.2159 +[2026-01-29T21:51:44.434291Z] Loop 1312: Loss: 6.08e-03, Avg Return: 0.427, Regret: 0.3724, Entropy: 0.2171 +[2026-01-29T21:51:45.594699Z] Loop 1313: Loss: 6.42e-03, Avg Return: 0.436, Regret: 0.3724, Entropy: 0.2120 +[2026-01-29T21:51:46.756303Z] Loop 1314: Loss: 5.62e-03, Avg Return: 0.436, Regret: 0.3724, Entropy: 0.2184 +[2026-01-29T21:51:47.974323Z] Loop 1315: Loss: 5.76e-03, Avg Return: 0.447, Regret: 0.3672, Entropy: 0.2190 +[2026-01-29T21:51:49.135195Z] Loop 1316: Loss: 5.86e-03, Avg Return: 0.435, Regret: 0.3672, Entropy: 0.2231 +[2026-01-29T21:51:50.296583Z] Loop 1317: Loss: 5.52e-03, Avg Return: 0.439, Regret: 0.3672, Entropy: 0.2170 +[2026-01-29T21:51:51.456911Z] Loop 1318: Loss: 5.62e-03, Avg Return: 0.434, Regret: 0.3672, Entropy: 0.2201 +[2026-01-29T21:51:52.616670Z] Loop 1319: Loss: 5.49e-03, Avg Return: 0.442, Regret: 0.3672, Entropy: 0.2133 +[2026-01-29T21:51:53.823860Z] Loop 1320: Loss: 5.85e-03, Avg Return: 0.433, Regret: 0.3656, Entropy: 0.2234 +[2026-01-29T21:51:54.984019Z] Loop 1321: Loss: 5.49e-03, Avg Return: 0.430, Regret: 0.3656, Entropy: 0.2302 +[2026-01-29T21:51:56.143209Z] Loop 1322: Loss: 5.38e-03, Avg Return: 0.448, Regret: 0.3656, Entropy: 0.2293 +[2026-01-29T21:51:57.304158Z] Loop 1323: Loss: 4.95e-03, Avg Return: 0.440, Regret: 0.3656, Entropy: 0.2242 +[2026-01-29T21:51:58.464152Z] Loop 1324: Loss: 4.65e-03, Avg Return: 0.439, Regret: 0.3656, Entropy: 0.2237 +[2026-01-29T21:51:59.681225Z] Loop 1325: Loss: 4.28e-03, Avg Return: 0.438, Regret: 0.3675, Entropy: 0.2151 +[2026-01-29T21:52:00.843062Z] Loop 1326: Loss: 4.40e-03, Avg Return: 0.441, Regret: 0.3675, Entropy: 0.2038 +[2026-01-29T21:52:02.002900Z] Loop 1327: Loss: 4.57e-03, Avg Return: 0.440, Regret: 0.3675, Entropy: 0.2101 +[2026-01-29T21:52:03.162425Z] Loop 1328: Loss: 4.42e-03, Avg Return: 0.436, Regret: 0.3675, Entropy: 0.2037 +[2026-01-29T21:52:04.324633Z] Loop 1329: Loss: 4.35e-03, Avg Return: 0.425, Regret: 0.3675, Entropy: 0.2161 +[2026-01-29T21:52:05.533295Z] Loop 1330: Loss: 4.26e-03, Avg Return: 0.440, Regret: 0.3667, Entropy: 0.2164 +[2026-01-29T21:52:06.696590Z] Loop 1331: Loss: 4.57e-03, Avg Return: 0.433, Regret: 0.3667, Entropy: 0.2213 +[2026-01-29T21:52:07.857701Z] Loop 1332: Loss: 4.56e-03, Avg Return: 0.434, Regret: 0.3667, Entropy: 0.2187 +[2026-01-29T21:52:09.017005Z] Loop 1333: Loss: 4.76e-03, Avg Return: 0.441, Regret: 0.3667, Entropy: 0.2141 +[2026-01-29T21:52:10.179780Z] Loop 1334: Loss: 4.80e-03, Avg Return: 0.443, Regret: 0.3667, Entropy: 0.2210 +[2026-01-29T21:52:11.390330Z] Loop 1335: Loss: 5.26e-03, Avg Return: 0.441, Regret: 0.3654, Entropy: 0.2217 +[2026-01-29T21:52:12.557036Z] Loop 1336: Loss: 4.76e-03, Avg Return: 0.441, Regret: 0.3654, Entropy: 0.2246 +[2026-01-29T21:52:13.718149Z] Loop 1337: Loss: 4.83e-03, Avg Return: 0.439, Regret: 0.3654, Entropy: 0.2310 +[2026-01-29T21:52:14.879307Z] Loop 1338: Loss: 4.87e-03, Avg Return: 0.431, Regret: 0.3654, Entropy: 0.2300 +[2026-01-29T21:52:16.038862Z] Loop 1339: Loss: 5.30e-03, Avg Return: 0.436, Regret: 0.3654, Entropy: 0.2304 +[2026-01-29T21:52:17.243483Z] Loop 1340: Loss: 5.44e-03, Avg Return: 0.440, Regret: 0.3647, Entropy: 0.2247 +[2026-01-29T21:52:18.403770Z] Loop 1341: Loss: 5.00e-03, Avg Return: 0.444, Regret: 0.3647, Entropy: 0.2260 +[2026-01-29T21:52:19.567973Z] Loop 1342: Loss: 5.66e-03, Avg Return: 0.438, Regret: 0.3647, Entropy: 0.2170 +[2026-01-29T21:52:20.735981Z] Loop 1343: Loss: 5.03e-03, Avg Return: 0.435, Regret: 0.3647, Entropy: 0.2125 +[2026-01-29T21:52:21.897563Z] Loop 1344: Loss: 4.88e-03, Avg Return: 0.422, Regret: 0.3647, Entropy: 0.2117 +[2026-01-29T21:52:23.110114Z] Loop 1345: Loss: 5.78e-03, Avg Return: 0.437, Regret: 0.3675, Entropy: 0.2080 +[2026-01-29T21:52:24.271175Z] Loop 1346: Loss: 5.72e-03, Avg Return: 0.437, Regret: 0.3675, Entropy: 0.2068 +[2026-01-29T21:52:25.433062Z] Loop 1347: Loss: 5.07e-03, Avg Return: 0.430, Regret: 0.3675, Entropy: 0.2078 +[2026-01-29T21:52:26.593869Z] Loop 1348: Loss: 5.12e-03, Avg Return: 0.442, Regret: 0.3675, Entropy: 0.2045 +[2026-01-29T21:52:27.761652Z] Loop 1349: Loss: 4.83e-03, Avg Return: 0.434, Regret: 0.3675, Entropy: 0.2118 +[2026-01-29T21:52:28.976378Z] Loop 1350: Loss: 5.26e-03, Avg Return: 0.447, Regret: 0.3646, Entropy: 0.2145 +[2026-01-29T21:52:30.138135Z] Loop 1351: Loss: 5.20e-03, Avg Return: 0.443, Regret: 0.3646, Entropy: 0.2175 +[2026-01-29T21:52:31.298859Z] Loop 1352: Loss: 5.41e-03, Avg Return: 0.439, Regret: 0.3646, Entropy: 0.2202 +[2026-01-29T21:52:32.458775Z] Loop 1353: Loss: 5.27e-03, Avg Return: 0.431, Regret: 0.3646, Entropy: 0.2250 +[2026-01-29T21:52:33.619292Z] Loop 1354: Loss: 5.40e-03, Avg Return: 0.448, Regret: 0.3646, Entropy: 0.2345 +[2026-01-29T21:52:34.824151Z] Loop 1355: Loss: 4.74e-03, Avg Return: 0.439, Regret: 0.3649, Entropy: 0.2092 +[2026-01-29T21:52:35.986647Z] Loop 1356: Loss: 4.06e-03, Avg Return: 0.434, Regret: 0.3649, Entropy: 0.1985 +[2026-01-29T21:52:37.150499Z] Loop 1357: Loss: 4.01e-03, Avg Return: 0.437, Regret: 0.3649, Entropy: 0.1930 +[2026-01-29T21:52:38.314107Z] Loop 1358: Loss: 3.58e-03, Avg Return: 0.423, Regret: 0.3649, Entropy: 0.1803 +[2026-01-29T21:52:39.475409Z] Loop 1359: Loss: 3.63e-03, Avg Return: 0.427, Regret: 0.3649, Entropy: 0.1778 +[2026-01-29T21:52:40.694299Z] Loop 1360: Loss: 3.99e-03, Avg Return: 0.425, Regret: 0.3733, Entropy: 0.1782 +[2026-01-29T21:52:41.854504Z] Loop 1361: Loss: 4.04e-03, Avg Return: 0.428, Regret: 0.3733, Entropy: 0.1828 +[2026-01-29T21:52:43.014452Z] Loop 1362: Loss: 3.64e-03, Avg Return: 0.431, Regret: 0.3733, Entropy: 0.1893 +[2026-01-29T21:52:44.175263Z] Loop 1363: Loss: 3.86e-03, Avg Return: 0.439, Regret: 0.3733, Entropy: 0.1925 +[2026-01-29T21:52:45.335155Z] Loop 1364: Loss: 4.23e-03, Avg Return: 0.440, Regret: 0.3733, Entropy: 0.2046 +[2026-01-29T21:52:46.543754Z] Loop 1365: Loss: 4.65e-03, Avg Return: 0.443, Regret: 0.3644, Entropy: 0.2048 +[2026-01-29T21:52:47.705090Z] Loop 1366: Loss: 5.07e-03, Avg Return: 0.433, Regret: 0.3644, Entropy: 0.2139 +[2026-01-29T21:52:48.870073Z] Loop 1367: Loss: 4.72e-03, Avg Return: 0.442, Regret: 0.3644, Entropy: 0.2129 +[2026-01-29T21:52:50.033899Z] Loop 1368: Loss: 5.23e-03, Avg Return: 0.443, Regret: 0.3644, Entropy: 0.2227 +[2026-01-29T21:52:51.196258Z] Loop 1369: Loss: 5.05e-03, Avg Return: 0.441, Regret: 0.3644, Entropy: 0.2170 +[2026-01-29T21:52:52.409440Z] Loop 1370: Loss: 5.18e-03, Avg Return: 0.436, Regret: 0.3632, Entropy: 0.2194 +[2026-01-29T21:52:53.571666Z] Loop 1371: Loss: 5.94e-03, Avg Return: 0.442, Regret: 0.3632, Entropy: 0.2150 +[2026-01-29T21:52:54.731037Z] Loop 1372: Loss: 5.24e-03, Avg Return: 0.443, Regret: 0.3632, Entropy: 0.2144 +[2026-01-29T21:52:55.889738Z] Loop 1373: Loss: 4.83e-03, Avg Return: 0.444, Regret: 0.3632, Entropy: 0.2099 +[2026-01-29T21:52:57.049727Z] Loop 1374: Loss: 5.24e-03, Avg Return: 0.435, Regret: 0.3632, Entropy: 0.2155 +[2026-01-29T21:52:58.253525Z] Loop 1375: Loss: 5.46e-03, Avg Return: 0.434, Regret: 0.3639, Entropy: 0.2141 +[2026-01-29T21:52:59.412369Z] Loop 1376: Loss: 5.44e-03, Avg Return: 0.443, Regret: 0.3639, Entropy: 0.2181 +[2026-01-29T21:53:00.573157Z] Loop 1377: Loss: 5.42e-03, Avg Return: 0.434, Regret: 0.3639, Entropy: 0.2149 +[2026-01-29T21:53:01.731848Z] Loop 1378: Loss: 4.89e-03, Avg Return: 0.438, Regret: 0.3639, Entropy: 0.2164 +[2026-01-29T21:53:02.890161Z] Loop 1379: Loss: 4.56e-03, Avg Return: 0.436, Regret: 0.3639, Entropy: 0.2129 +[2026-01-29T21:53:04.095140Z] Loop 1380: Loss: 5.01e-03, Avg Return: 0.440, Regret: 0.3632, Entropy: 0.2085 +[2026-01-29T21:53:05.256147Z] Loop 1381: Loss: 4.87e-03, Avg Return: 0.438, Regret: 0.3632, Entropy: 0.2082 +[2026-01-29T21:53:06.415369Z] Loop 1382: Loss: 4.52e-03, Avg Return: 0.451, Regret: 0.3632, Entropy: 0.1963 +[2026-01-29T21:53:07.576881Z] Loop 1383: Loss: 4.56e-03, Avg Return: 0.438, Regret: 0.3632, Entropy: 0.2007 +[2026-01-29T21:53:08.739017Z] Loop 1384: Loss: 3.80e-03, Avg Return: 0.442, Regret: 0.3632, Entropy: 0.2014 +[2026-01-29T21:53:09.947649Z] Loop 1385: Loss: 4.21e-03, Avg Return: 0.447, Regret: 0.3644, Entropy: 0.2012 +[2026-01-29T21:53:11.112228Z] Loop 1386: Loss: 4.31e-03, Avg Return: 0.442, Regret: 0.3644, Entropy: 0.2069 +[2026-01-29T21:53:12.272751Z] Loop 1387: Loss: 4.78e-03, Avg Return: 0.439, Regret: 0.3644, Entropy: 0.1968 +[2026-01-29T21:53:13.436798Z] Loop 1388: Loss: 4.50e-03, Avg Return: 0.444, Regret: 0.3644, Entropy: 0.2048 +[2026-01-29T21:53:14.598442Z] Loop 1389: Loss: 4.73e-03, Avg Return: 0.431, Regret: 0.3644, Entropy: 0.2104 +[2026-01-29T21:53:15.815382Z] Loop 1390: Loss: 4.74e-03, Avg Return: 0.450, Regret: 0.3628, Entropy: 0.2007 +[2026-01-29T21:53:16.979881Z] Loop 1391: Loss: 4.88e-03, Avg Return: 0.439, Regret: 0.3628, Entropy: 0.1872 +[2026-01-29T21:53:18.141244Z] Loop 1392: Loss: 5.30e-03, Avg Return: 0.450, Regret: 0.3628, Entropy: 0.1956 +[2026-01-29T21:53:19.304322Z] Loop 1393: Loss: 4.79e-03, Avg Return: 0.443, Regret: 0.3628, Entropy: 0.1964 +[2026-01-29T21:53:20.466081Z] Loop 1394: Loss: 5.05e-03, Avg Return: 0.441, Regret: 0.3628, Entropy: 0.1983 +[2026-01-29T21:53:21.672773Z] Loop 1395: Loss: 4.74e-03, Avg Return: 0.444, Regret: 0.3627, Entropy: 0.2039 +[2026-01-29T21:53:22.833774Z] Loop 1396: Loss: 4.63e-03, Avg Return: 0.440, Regret: 0.3627, Entropy: 0.1947 +[2026-01-29T21:53:23.995787Z] Loop 1397: Loss: 4.43e-03, Avg Return: 0.439, Regret: 0.3627, Entropy: 0.1975 +[2026-01-29T21:53:25.155282Z] Loop 1398: Loss: 4.61e-03, Avg Return: 0.442, Regret: 0.3627, Entropy: 0.1979 +[2026-01-29T21:53:26.315163Z] Loop 1399: Loss: 3.78e-03, Avg Return: 0.437, Regret: 0.3627, Entropy: 0.1913 +[2026-01-29T21:53:27.520937Z] Loop 1400: Loss: 3.71e-03, Avg Return: 0.440, Regret: 0.3642, Entropy: 0.1907 +[2026-01-29T21:53:28.681621Z] Loop 1401: Loss: 3.89e-03, Avg Return: 0.440, Regret: 0.3642, Entropy: 0.1951 +[2026-01-29T21:53:29.841375Z] Loop 1402: Loss: 3.58e-03, Avg Return: 0.442, Regret: 0.3642, Entropy: 0.1905 +[2026-01-29T21:53:31.001035Z] Loop 1403: Loss: 3.64e-03, Avg Return: 0.434, Regret: 0.3642, Entropy: 0.1892 +[2026-01-29T21:53:32.160214Z] Loop 1404: Loss: 3.48e-03, Avg Return: 0.439, Regret: 0.3642, Entropy: 0.1815 +[2026-01-29T21:53:33.370393Z] Loop 1405: Loss: 3.45e-03, Avg Return: 0.436, Regret: 0.3664, Entropy: 0.1780 +[2026-01-29T21:53:34.531991Z] Loop 1406: Loss: 3.23e-03, Avg Return: 0.439, Regret: 0.3664, Entropy: 0.1756 +[2026-01-29T21:53:35.692125Z] Loop 1407: Loss: 3.43e-03, Avg Return: 0.438, Regret: 0.3664, Entropy: 0.1754 +[2026-01-29T21:53:36.851459Z] Loop 1408: Loss: 3.40e-03, Avg Return: 0.437, Regret: 0.3664, Entropy: 0.1799 +[2026-01-29T21:53:38.010918Z] Loop 1409: Loss: 3.41e-03, Avg Return: 0.437, Regret: 0.3664, Entropy: 0.1838 +[2026-01-29T21:53:39.216559Z] Loop 1410: Loss: 3.27e-03, Avg Return: 0.440, Regret: 0.3656, Entropy: 0.1800 +[2026-01-29T21:53:40.379950Z] Loop 1411: Loss: 3.67e-03, Avg Return: 0.436, Regret: 0.3656, Entropy: 0.1883 +[2026-01-29T21:53:41.539918Z] Loop 1412: Loss: 3.76e-03, Avg Return: 0.434, Regret: 0.3656, Entropy: 0.1909 +[2026-01-29T21:53:42.699517Z] Loop 1413: Loss: 3.98e-03, Avg Return: 0.447, Regret: 0.3656, Entropy: 0.1877 +[2026-01-29T21:53:43.860555Z] Loop 1414: Loss: 4.23e-03, Avg Return: 0.447, Regret: 0.3656, Entropy: 0.1972 +[2026-01-29T21:53:45.070564Z] Loop 1415: Loss: 4.21e-03, Avg Return: 0.444, Regret: 0.3620, Entropy: 0.1997 +[2026-01-29T21:53:46.229930Z] Loop 1416: Loss: 4.40e-03, Avg Return: 0.451, Regret: 0.3620, Entropy: 0.2009 +[2026-01-29T21:53:47.389720Z] Loop 1417: Loss: 4.22e-03, Avg Return: 0.438, Regret: 0.3620, Entropy: 0.1968 +[2026-01-29T21:53:48.549067Z] Loop 1418: Loss: 4.52e-03, Avg Return: 0.444, Regret: 0.3620, Entropy: 0.2090 +[2026-01-29T21:53:49.709357Z] Loop 1419: Loss: 4.64e-03, Avg Return: 0.436, Regret: 0.3620, Entropy: 0.2048 +[2026-01-29T21:53:50.917825Z] Loop 1420: Loss: 4.55e-03, Avg Return: 0.440, Regret: 0.3611, Entropy: 0.2052 +[2026-01-29T21:53:52.078153Z] Loop 1421: Loss: 4.44e-03, Avg Return: 0.439, Regret: 0.3611, Entropy: 0.2019 +[2026-01-29T21:53:53.237178Z] Loop 1422: Loss: 5.05e-03, Avg Return: 0.438, Regret: 0.3611, Entropy: 0.2070 +[2026-01-29T21:53:54.401357Z] Loop 1423: Loss: 4.97e-03, Avg Return: 0.450, Regret: 0.3611, Entropy: 0.2190 +[2026-01-29T21:53:55.562274Z] Loop 1424: Loss: 5.29e-03, Avg Return: 0.436, Regret: 0.3611, Entropy: 0.2181 +[2026-01-29T21:53:56.769320Z] Loop 1425: Loss: 5.30e-03, Avg Return: 0.446, Regret: 0.3617, Entropy: 0.2238 +[2026-01-29T21:53:57.929851Z] Loop 1426: Loss: 5.44e-03, Avg Return: 0.444, Regret: 0.3617, Entropy: 0.2205 +[2026-01-29T21:53:59.089002Z] Loop 1427: Loss: 5.18e-03, Avg Return: 0.438, Regret: 0.3617, Entropy: 0.2181 +[2026-01-29T21:54:00.249556Z] Loop 1428: Loss: 5.22e-03, Avg Return: 0.444, Regret: 0.3617, Entropy: 0.2095 +[2026-01-29T21:54:01.408559Z] Loop 1429: Loss: 5.14e-03, Avg Return: 0.444, Regret: 0.3617, Entropy: 0.2121 +[2026-01-29T21:54:02.615022Z] Loop 1430: Loss: 4.59e-03, Avg Return: 0.442, Regret: 0.3608, Entropy: 0.2163 +[2026-01-29T21:54:03.773919Z] Loop 1431: Loss: 5.08e-03, Avg Return: 0.450, Regret: 0.3608, Entropy: 0.2124 +[2026-01-29T21:54:04.934193Z] Loop 1432: Loss: 4.71e-03, Avg Return: 0.443, Regret: 0.3608, Entropy: 0.2105 +[2026-01-29T21:54:06.093365Z] Loop 1433: Loss: 4.35e-03, Avg Return: 0.445, Regret: 0.3608, Entropy: 0.2044 +[2026-01-29T21:54:07.252639Z] Loop 1434: Loss: 4.28e-03, Avg Return: 0.445, Regret: 0.3608, Entropy: 0.2027 +[2026-01-29T21:54:08.458083Z] Loop 1435: Loss: 4.95e-03, Avg Return: 0.447, Regret: 0.3606, Entropy: 0.2004 +[2026-01-29T21:54:09.618425Z] Loop 1436: Loss: 5.16e-03, Avg Return: 0.449, Regret: 0.3606, Entropy: 0.2073 +[2026-01-29T21:54:10.777684Z] Loop 1437: Loss: 4.47e-03, Avg Return: 0.447, Regret: 0.3606, Entropy: 0.2047 +[2026-01-29T21:54:11.938005Z] Loop 1438: Loss: 4.67e-03, Avg Return: 0.438, Regret: 0.3606, Entropy: 0.2099 +[2026-01-29T21:54:13.097220Z] Loop 1439: Loss: 4.75e-03, Avg Return: 0.447, Regret: 0.3606, Entropy: 0.2034 +[2026-01-29T21:54:14.304106Z] Loop 1440: Loss: 4.49e-03, Avg Return: 0.444, Regret: 0.3606, Entropy: 0.2032 +[2026-01-29T21:54:15.464065Z] Loop 1441: Loss: 4.65e-03, Avg Return: 0.442, Regret: 0.3606, Entropy: 0.2077 +[2026-01-29T21:54:16.625979Z] Loop 1442: Loss: 4.68e-03, Avg Return: 0.441, Regret: 0.3606, Entropy: 0.2094 +[2026-01-29T21:54:17.786291Z] Loop 1443: Loss: 4.69e-03, Avg Return: 0.437, Regret: 0.3606, Entropy: 0.2062 +[2026-01-29T21:54:18.946508Z] Loop 1444: Loss: 4.33e-03, Avg Return: 0.444, Regret: 0.3606, Entropy: 0.1902 +[2026-01-29T21:54:20.152211Z] Loop 1445: Loss: 4.23e-03, Avg Return: 0.446, Regret: 0.3603, Entropy: 0.1964 +[2026-01-29T21:54:21.311450Z] Loop 1446: Loss: 4.10e-03, Avg Return: 0.443, Regret: 0.3603, Entropy: 0.1980 +[2026-01-29T21:54:22.471371Z] Loop 1447: Loss: 4.13e-03, Avg Return: 0.444, Regret: 0.3603, Entropy: 0.1870 +[2026-01-29T21:54:23.630809Z] Loop 1448: Loss: 3.45e-03, Avg Return: 0.442, Regret: 0.3603, Entropy: 0.1807 +[2026-01-29T21:54:24.789408Z] Loop 1449: Loss: 3.92e-03, Avg Return: 0.443, Regret: 0.3603, Entropy: 0.1792 +[2026-01-29T21:54:25.994810Z] Loop 1450: Loss: 3.37e-03, Avg Return: 0.440, Regret: 0.3620, Entropy: 0.1778 +[2026-01-29T21:54:27.158116Z] Loop 1451: Loss: 3.50e-03, Avg Return: 0.440, Regret: 0.3620, Entropy: 0.1769 +[2026-01-29T21:54:28.317387Z] Loop 1452: Loss: 3.51e-03, Avg Return: 0.435, Regret: 0.3620, Entropy: 0.1776 +[2026-01-29T21:54:29.475682Z] Loop 1453: Loss: 4.31e-03, Avg Return: 0.446, Regret: 0.3620, Entropy: 0.1836 +[2026-01-29T21:54:30.635297Z] Loop 1454: Loss: 4.37e-03, Avg Return: 0.445, Regret: 0.3620, Entropy: 0.1951 +[2026-01-29T21:54:31.844679Z] Loop 1455: Loss: 4.45e-03, Avg Return: 0.438, Regret: 0.3600, Entropy: 0.1946 +[2026-01-29T21:54:33.005853Z] Loop 1456: Loss: 4.77e-03, Avg Return: 0.444, Regret: 0.3600, Entropy: 0.1940 +[2026-01-29T21:54:34.164015Z] Loop 1457: Loss: 5.30e-03, Avg Return: 0.437, Regret: 0.3600, Entropy: 0.2052 +[2026-01-29T21:54:35.323478Z] Loop 1458: Loss: 5.32e-03, Avg Return: 0.443, Regret: 0.3600, Entropy: 0.1971 +[2026-01-29T21:54:36.483107Z] Loop 1459: Loss: 4.55e-03, Avg Return: 0.438, Regret: 0.3600, Entropy: 0.1983 +[2026-01-29T21:54:37.687612Z] Loop 1460: Loss: 5.14e-03, Avg Return: 0.442, Regret: 0.3603, Entropy: 0.1932 +[2026-01-29T21:54:38.846141Z] Loop 1461: Loss: 5.13e-03, Avg Return: 0.440, Regret: 0.3603, Entropy: 0.1952 +[2026-01-29T21:54:40.005649Z] Loop 1462: Loss: 5.21e-03, Avg Return: 0.440, Regret: 0.3603, Entropy: 0.1981 +[2026-01-29T21:54:41.164725Z] Loop 1463: Loss: 4.61e-03, Avg Return: 0.440, Regret: 0.3603, Entropy: 0.2008 +[2026-01-29T21:54:42.324472Z] Loop 1464: Loss: 4.27e-03, Avg Return: 0.438, Regret: 0.3603, Entropy: 0.1975 +[2026-01-29T21:54:43.529130Z] Loop 1465: Loss: 4.69e-03, Avg Return: 0.452, Regret: 0.3598, Entropy: 0.1964 +[2026-01-29T21:54:44.689459Z] Loop 1466: Loss: 5.26e-03, Avg Return: 0.451, Regret: 0.3598, Entropy: 0.1965 +[2026-01-29T21:54:45.850094Z] Loop 1467: Loss: 5.14e-03, Avg Return: 0.446, Regret: 0.3598, Entropy: 0.1856 +[2026-01-29T21:54:47.010857Z] Loop 1468: Loss: 5.08e-03, Avg Return: 0.444, Regret: 0.3598, Entropy: 0.1946 +[2026-01-29T21:54:48.170843Z] Loop 1469: Loss: 5.16e-03, Avg Return: 0.441, Regret: 0.3598, Entropy: 0.1920 +[2026-01-29T21:54:49.376756Z] Loop 1470: Loss: 5.22e-03, Avg Return: 0.440, Regret: 0.3623, Entropy: 0.1938 +[2026-01-29T21:54:50.535580Z] Loop 1471: Loss: 5.58e-03, Avg Return: 0.444, Regret: 0.3623, Entropy: 0.1960 +[2026-01-29T21:54:51.694801Z] Loop 1472: Loss: 4.67e-03, Avg Return: 0.448, Regret: 0.3623, Entropy: 0.1986 +[2026-01-29T21:54:52.854218Z] Loop 1473: Loss: 4.36e-03, Avg Return: 0.439, Regret: 0.3623, Entropy: 0.1955 +[2026-01-29T21:54:54.014262Z] Loop 1474: Loss: 4.08e-03, Avg Return: 0.450, Regret: 0.3623, Entropy: 0.1884 +[2026-01-29T21:54:55.220575Z] Loop 1475: Loss: 4.07e-03, Avg Return: 0.448, Regret: 0.3595, Entropy: 0.1960 +[2026-01-29T21:54:56.381523Z] Loop 1476: Loss: 4.21e-03, Avg Return: 0.445, Regret: 0.3595, Entropy: 0.1861 +[2026-01-29T21:54:57.540427Z] Loop 1477: Loss: 3.95e-03, Avg Return: 0.448, Regret: 0.3595, Entropy: 0.1815 +[2026-01-29T21:54:58.702301Z] Loop 1478: Loss: 4.17e-03, Avg Return: 0.444, Regret: 0.3595, Entropy: 0.1847 +[2026-01-29T21:54:59.860895Z] Loop 1479: Loss: 4.02e-03, Avg Return: 0.439, Regret: 0.3595, Entropy: 0.1763 +[2026-01-29T21:55:01.064835Z] Loop 1480: Loss: 4.07e-03, Avg Return: 0.443, Regret: 0.3630, Entropy: 0.1672 +[2026-01-29T21:55:02.223391Z] Loop 1481: Loss: 4.40e-03, Avg Return: 0.441, Regret: 0.3630, Entropy: 0.1709 +[2026-01-29T21:55:03.384826Z] Loop 1482: Loss: 4.39e-03, Avg Return: 0.439, Regret: 0.3630, Entropy: 0.1751 +[2026-01-29T21:55:04.545702Z] Loop 1483: Loss: 4.40e-03, Avg Return: 0.436, Regret: 0.3630, Entropy: 0.1689 +[2026-01-29T21:55:05.705074Z] Loop 1484: Loss: 4.01e-03, Avg Return: 0.438, Regret: 0.3630, Entropy: 0.1713 +[2026-01-29T21:55:06.914077Z] Loop 1485: Loss: 4.76e-03, Avg Return: 0.451, Regret: 0.3620, Entropy: 0.1756 +[2026-01-29T21:55:08.076350Z] Loop 1486: Loss: 4.27e-03, Avg Return: 0.446, Regret: 0.3620, Entropy: 0.1885 +[2026-01-29T21:55:09.237664Z] Loop 1487: Loss: 4.51e-03, Avg Return: 0.448, Regret: 0.3620, Entropy: 0.1951 +[2026-01-29T21:55:10.397137Z] Loop 1488: Loss: 4.48e-03, Avg Return: 0.445, Regret: 0.3620, Entropy: 0.2002 +[2026-01-29T21:55:11.557312Z] Loop 1489: Loss: 4.41e-03, Avg Return: 0.440, Regret: 0.3620, Entropy: 0.2092 +[2026-01-29T21:55:12.762387Z] Loop 1490: Loss: 4.73e-03, Avg Return: 0.442, Regret: 0.3610, Entropy: 0.2077 +[2026-01-29T21:55:13.922273Z] Loop 1491: Loss: 4.89e-03, Avg Return: 0.441, Regret: 0.3610, Entropy: 0.2057 +[2026-01-29T21:55:15.081371Z] Loop 1492: Loss: 4.58e-03, Avg Return: 0.439, Regret: 0.3610, Entropy: 0.2045 +[2026-01-29T21:55:16.241089Z] Loop 1493: Loss: 4.67e-03, Avg Return: 0.445, Regret: 0.3610, Entropy: 0.2027 +[2026-01-29T21:55:17.400115Z] Loop 1494: Loss: 4.80e-03, Avg Return: 0.441, Regret: 0.3610, Entropy: 0.1983 +[2026-01-29T21:55:18.605009Z] Loop 1495: Loss: 5.22e-03, Avg Return: 0.438, Regret: 0.3667, Entropy: 0.1918 +[2026-01-29T21:55:19.763899Z] Loop 1496: Loss: 5.15e-03, Avg Return: 0.438, Regret: 0.3667, Entropy: 0.1946 +[2026-01-29T21:55:20.923870Z] Loop 1497: Loss: 4.96e-03, Avg Return: 0.435, Regret: 0.3667, Entropy: 0.1954 +[2026-01-29T21:55:22.082817Z] Loop 1498: Loss: 4.82e-03, Avg Return: 0.444, Regret: 0.3667, Entropy: 0.1900 +[2026-01-29T21:55:23.243322Z] Loop 1499: Loss: 4.71e-03, Avg Return: 0.443, Regret: 0.3667, Entropy: 0.1898 +[2026-01-29T21:55:24.448429Z] Loop 1500: Loss: 4.82e-03, Avg Return: 0.443, Regret: 0.3604, Entropy: 0.1949 +[2026-01-29T21:55:25.608558Z] Loop 1501: Loss: 4.69e-03, Avg Return: 0.445, Regret: 0.3604, Entropy: 0.1918 +[2026-01-29T21:55:26.767306Z] Loop 1502: Loss: 3.86e-03, Avg Return: 0.445, Regret: 0.3604, Entropy: 0.1792 +[2026-01-29T21:55:27.927112Z] Loop 1503: Loss: 3.63e-03, Avg Return: 0.441, Regret: 0.3604, Entropy: 0.1754 +[2026-01-29T21:55:29.085930Z] Loop 1504: Loss: 3.23e-03, Avg Return: 0.437, Regret: 0.3604, Entropy: 0.1674 +[2026-01-29T21:55:30.290947Z] Loop 1505: Loss: 3.43e-03, Avg Return: 0.448, Regret: 0.3600, Entropy: 0.1589 +[2026-01-29T21:55:31.450671Z] Loop 1506: Loss: 3.02e-03, Avg Return: 0.453, Regret: 0.3600, Entropy: 0.1607 +[2026-01-29T21:55:32.611558Z] Loop 1507: Loss: 3.32e-03, Avg Return: 0.439, Regret: 0.3600, Entropy: 0.1595 +[2026-01-29T21:55:33.770336Z] Loop 1508: Loss: 3.16e-03, Avg Return: 0.442, Regret: 0.3600, Entropy: 0.1516 +[2026-01-29T21:55:34.931167Z] Loop 1509: Loss: 3.06e-03, Avg Return: 0.440, Regret: 0.3600, Entropy: 0.1557 +[2026-01-29T21:55:36.136012Z] Loop 1510: Loss: 3.18e-03, Avg Return: 0.442, Regret: 0.3633, Entropy: 0.1525 +[2026-01-29T21:55:37.296063Z] Loop 1511: Loss: 3.11e-03, Avg Return: 0.439, Regret: 0.3633, Entropy: 0.1586 +[2026-01-29T21:55:38.455071Z] Loop 1512: Loss: 3.36e-03, Avg Return: 0.436, Regret: 0.3633, Entropy: 0.1535 +[2026-01-29T21:55:39.615449Z] Loop 1513: Loss: 3.14e-03, Avg Return: 0.438, Regret: 0.3633, Entropy: 0.1524 +[2026-01-29T21:55:40.774392Z] Loop 1514: Loss: 3.10e-03, Avg Return: 0.448, Regret: 0.3633, Entropy: 0.1484 +[2026-01-29T21:55:41.979023Z] Loop 1515: Loss: 2.91e-03, Avg Return: 0.440, Regret: 0.3619, Entropy: 0.1508 +[2026-01-29T21:55:43.139034Z] Loop 1516: Loss: 2.97e-03, Avg Return: 0.446, Regret: 0.3619, Entropy: 0.1505 +[2026-01-29T21:55:44.299014Z] Loop 1517: Loss: 3.25e-03, Avg Return: 0.446, Regret: 0.3619, Entropy: 0.1539 +[2026-01-29T21:55:45.458528Z] Loop 1518: Loss: 2.99e-03, Avg Return: 0.450, Regret: 0.3619, Entropy: 0.1615 +[2026-01-29T21:55:46.621182Z] Loop 1519: Loss: 3.88e-03, Avg Return: 0.444, Regret: 0.3619, Entropy: 0.1624 +[2026-01-29T21:55:47.825582Z] Loop 1520: Loss: 3.91e-03, Avg Return: 0.444, Regret: 0.3587, Entropy: 0.1649 +[2026-01-29T21:55:48.985519Z] Loop 1521: Loss: 3.66e-03, Avg Return: 0.445, Regret: 0.3587, Entropy: 0.1718 +[2026-01-29T21:55:50.149447Z] Loop 1522: Loss: 4.37e-03, Avg Return: 0.447, Regret: 0.3587, Entropy: 0.1764 +[2026-01-29T21:55:51.309719Z] Loop 1523: Loss: 4.06e-03, Avg Return: 0.445, Regret: 0.3587, Entropy: 0.1778 +[2026-01-29T21:55:52.469354Z] Loop 1524: Loss: 3.90e-03, Avg Return: 0.441, Regret: 0.3587, Entropy: 0.1726 +[2026-01-29T21:55:53.677041Z] Loop 1525: Loss: 4.68e-03, Avg Return: 0.449, Regret: 0.3600, Entropy: 0.1719 +[2026-01-29T21:55:54.835783Z] Loop 1526: Loss: 4.75e-03, Avg Return: 0.448, Regret: 0.3600, Entropy: 0.1708 +[2026-01-29T21:55:55.996734Z] Loop 1527: Loss: 4.71e-03, Avg Return: 0.445, Regret: 0.3600, Entropy: 0.1763 +[2026-01-29T21:55:57.156365Z] Loop 1528: Loss: 4.53e-03, Avg Return: 0.436, Regret: 0.3600, Entropy: 0.1800 +[2026-01-29T21:55:58.315832Z] Loop 1529: Loss: 4.56e-03, Avg Return: 0.441, Regret: 0.3600, Entropy: 0.1849 +[2026-01-29T21:55:59.520840Z] Loop 1530: Loss: 4.02e-03, Avg Return: 0.447, Regret: 0.3587, Entropy: 0.1729 +[2026-01-29T21:56:00.681160Z] Loop 1531: Loss: 3.94e-03, Avg Return: 0.443, Regret: 0.3587, Entropy: 0.1706 +[2026-01-29T21:56:01.840107Z] Loop 1532: Loss: 3.64e-03, Avg Return: 0.450, Regret: 0.3587, Entropy: 0.1652 +[2026-01-29T21:56:02.999582Z] Loop 1533: Loss: 3.68e-03, Avg Return: 0.443, Regret: 0.3587, Entropy: 0.1695 +[2026-01-29T21:56:04.158383Z] Loop 1534: Loss: 3.56e-03, Avg Return: 0.451, Regret: 0.3587, Entropy: 0.1712 +[2026-01-29T21:56:05.363972Z] Loop 1535: Loss: 3.53e-03, Avg Return: 0.451, Regret: 0.3587, Entropy: 0.1597 +[2026-01-29T21:56:06.524765Z] Loop 1536: Loss: 3.32e-03, Avg Return: 0.452, Regret: 0.3587, Entropy: 0.1587 +[2026-01-29T21:56:07.685321Z] Loop 1537: Loss: 3.21e-03, Avg Return: 0.448, Regret: 0.3587, Entropy: 0.1536 +[2026-01-29T21:56:08.843313Z] Loop 1538: Loss: 3.04e-03, Avg Return: 0.443, Regret: 0.3587, Entropy: 0.1482 +[2026-01-29T21:56:10.002344Z] Loop 1539: Loss: 3.15e-03, Avg Return: 0.445, Regret: 0.3587, Entropy: 0.1479 +[2026-01-29T21:56:11.205451Z] Loop 1540: Loss: 3.37e-03, Avg Return: 0.441, Regret: 0.3625, Entropy: 0.1488 +[2026-01-29T21:56:12.366307Z] Loop 1541: Loss: 3.47e-03, Avg Return: 0.442, Regret: 0.3625, Entropy: 0.1571 +[2026-01-29T21:56:13.525459Z] Loop 1542: Loss: 3.62e-03, Avg Return: 0.439, Regret: 0.3625, Entropy: 0.1513 +[2026-01-29T21:56:14.684782Z] Loop 1543: Loss: 3.83e-03, Avg Return: 0.437, Regret: 0.3625, Entropy: 0.1522 +[2026-01-29T21:56:15.843141Z] Loop 1544: Loss: 3.76e-03, Avg Return: 0.440, Regret: 0.3625, Entropy: 0.1516 +[2026-01-29T21:56:17.045890Z] Loop 1545: Loss: 3.30e-03, Avg Return: 0.432, Regret: 0.3666, Entropy: 0.1501 +[2026-01-29T21:56:18.205373Z] Loop 1546: Loss: 3.40e-03, Avg Return: 0.433, Regret: 0.3666, Entropy: 0.1440 +[2026-01-29T21:56:19.365885Z] Loop 1547: Loss: 3.64e-03, Avg Return: 0.441, Regret: 0.3666, Entropy: 0.1500 +[2026-01-29T21:56:20.524584Z] Loop 1548: Loss: 3.56e-03, Avg Return: 0.435, Regret: 0.3666, Entropy: 0.1484 +[2026-01-29T21:56:21.684214Z] Loop 1549: Loss: 3.53e-03, Avg Return: 0.445, Regret: 0.3666, Entropy: 0.1559 +[2026-01-29T21:56:22.888075Z] Loop 1550: Loss: 3.61e-03, Avg Return: 0.442, Regret: 0.3603, Entropy: 0.1608 +[2026-01-29T21:56:24.051286Z] Loop 1551: Loss: 3.24e-03, Avg Return: 0.445, Regret: 0.3603, Entropy: 0.1502 +[2026-01-29T21:56:25.210447Z] Loop 1552: Loss: 3.13e-03, Avg Return: 0.440, Regret: 0.3603, Entropy: 0.1593 +[2026-01-29T21:56:26.369272Z] Loop 1553: Loss: 3.56e-03, Avg Return: 0.446, Regret: 0.3603, Entropy: 0.1648 +[2026-01-29T21:56:27.529074Z] Loop 1554: Loss: 4.04e-03, Avg Return: 0.448, Regret: 0.3603, Entropy: 0.1754 +[2026-01-29T21:56:28.737918Z] Loop 1555: Loss: 4.00e-03, Avg Return: 0.447, Regret: 0.3581, Entropy: 0.1878 +[2026-01-29T21:56:29.899811Z] Loop 1556: Loss: 3.93e-03, Avg Return: 0.443, Regret: 0.3581, Entropy: 0.1768 +[2026-01-29T21:56:31.059765Z] Loop 1557: Loss: 4.19e-03, Avg Return: 0.441, Regret: 0.3581, Entropy: 0.1879 +[2026-01-29T21:56:32.218606Z] Loop 1558: Loss: 4.18e-03, Avg Return: 0.438, Regret: 0.3581, Entropy: 0.1823 +[2026-01-29T21:56:33.379328Z] Loop 1559: Loss: 4.24e-03, Avg Return: 0.440, Regret: 0.3581, Entropy: 0.1833 +[2026-01-29T21:56:34.586639Z] Loop 1560: Loss: 4.15e-03, Avg Return: 0.438, Regret: 0.3617, Entropy: 0.1894 +[2026-01-29T21:56:35.747563Z] Loop 1561: Loss: 3.94e-03, Avg Return: 0.436, Regret: 0.3617, Entropy: 0.1812 +[2026-01-29T21:56:36.907120Z] Loop 1562: Loss: 4.30e-03, Avg Return: 0.442, Regret: 0.3617, Entropy: 0.1806 +[2026-01-29T21:56:38.068357Z] Loop 1563: Loss: 4.40e-03, Avg Return: 0.444, Regret: 0.3617, Entropy: 0.1825 +[2026-01-29T21:56:39.229505Z] Loop 1564: Loss: 4.17e-03, Avg Return: 0.435, Regret: 0.3617, Entropy: 0.1839 +[2026-01-29T21:56:40.435298Z] Loop 1565: Loss: 4.39e-03, Avg Return: 0.447, Regret: 0.3592, Entropy: 0.1851 +[2026-01-29T21:56:41.595267Z] Loop 1566: Loss: 4.05e-03, Avg Return: 0.440, Regret: 0.3592, Entropy: 0.1905 +[2026-01-29T21:56:42.755993Z] Loop 1567: Loss: 4.03e-03, Avg Return: 0.449, Regret: 0.3592, Entropy: 0.1769 +[2026-01-29T21:56:43.917685Z] Loop 1568: Loss: 3.86e-03, Avg Return: 0.442, Regret: 0.3592, Entropy: 0.1771 +[2026-01-29T21:56:45.083441Z] Loop 1569: Loss: 3.70e-03, Avg Return: 0.440, Regret: 0.3592, Entropy: 0.1738 +[2026-01-29T21:56:46.291061Z] Loop 1570: Loss: 3.31e-03, Avg Return: 0.452, Regret: 0.3579, Entropy: 0.1641 +[2026-01-29T21:56:47.450504Z] Loop 1571: Loss: 3.15e-03, Avg Return: 0.446, Regret: 0.3579, Entropy: 0.1717 +[2026-01-29T21:56:48.610836Z] Loop 1572: Loss: 3.33e-03, Avg Return: 0.445, Regret: 0.3579, Entropy: 0.1594 +[2026-01-29T21:56:49.771161Z] Loop 1573: Loss: 3.61e-03, Avg Return: 0.441, Regret: 0.3579, Entropy: 0.1572 +[2026-01-29T21:56:50.932098Z] Loop 1574: Loss: 3.47e-03, Avg Return: 0.442, Regret: 0.3579, Entropy: 0.1631 +[2026-01-29T21:56:52.136991Z] Loop 1575: Loss: 3.82e-03, Avg Return: 0.448, Regret: 0.3592, Entropy: 0.1640 +[2026-01-29T21:56:53.299215Z] Loop 1576: Loss: 3.61e-03, Avg Return: 0.447, Regret: 0.3592, Entropy: 0.1619 +[2026-01-29T21:56:54.460324Z] Loop 1577: Loss: 3.28e-03, Avg Return: 0.448, Regret: 0.3592, Entropy: 0.1625 +[2026-01-29T21:56:55.622507Z] Loop 1578: Loss: 3.42e-03, Avg Return: 0.440, Regret: 0.3592, Entropy: 0.1618 +[2026-01-29T21:56:56.789273Z] Loop 1579: Loss: 2.88e-03, Avg Return: 0.446, Regret: 0.3592, Entropy: 0.1559 +[2026-01-29T21:56:58.002337Z] Loop 1580: Loss: 3.40e-03, Avg Return: 0.446, Regret: 0.3577, Entropy: 0.1569 +[2026-01-29T21:56:59.171004Z] Loop 1581: Loss: 3.29e-03, Avg Return: 0.447, Regret: 0.3577, Entropy: 0.1631 +[2026-01-29T21:57:00.329893Z] Loop 1582: Loss: 3.53e-03, Avg Return: 0.447, Regret: 0.3577, Entropy: 0.1600 +[2026-01-29T21:57:01.490035Z] Loop 1583: Loss: 3.44e-03, Avg Return: 0.450, Regret: 0.3577, Entropy: 0.1631 +[2026-01-29T21:57:02.649299Z] Loop 1584: Loss: 3.49e-03, Avg Return: 0.450, Regret: 0.3577, Entropy: 0.1614 +[2026-01-29T21:57:03.855082Z] Loop 1585: Loss: 3.27e-03, Avg Return: 0.443, Regret: 0.3575, Entropy: 0.1606 +[2026-01-29T21:57:05.019610Z] Loop 1586: Loss: 3.46e-03, Avg Return: 0.447, Regret: 0.3575, Entropy: 0.1609 +[2026-01-29T21:57:06.182551Z] Loop 1587: Loss: 3.42e-03, Avg Return: 0.442, Regret: 0.3575, Entropy: 0.1530 +[2026-01-29T21:57:07.343190Z] Loop 1588: Loss: 3.22e-03, Avg Return: 0.454, Regret: 0.3575, Entropy: 0.1611 +[2026-01-29T21:57:08.504354Z] Loop 1589: Loss: 3.79e-03, Avg Return: 0.448, Regret: 0.3575, Entropy: 0.1667 +[2026-01-29T21:57:09.710670Z] Loop 1590: Loss: 4.32e-03, Avg Return: 0.451, Regret: 0.3575, Entropy: 0.1707 +[2026-01-29T21:57:10.871352Z] Loop 1591: Loss: 4.08e-03, Avg Return: 0.452, Regret: 0.3575, Entropy: 0.1679 +[2026-01-29T21:57:12.030481Z] Loop 1592: Loss: 3.91e-03, Avg Return: 0.452, Regret: 0.3575, Entropy: 0.1644 +[2026-01-29T21:57:13.190907Z] Loop 1593: Loss: 3.44e-03, Avg Return: 0.445, Regret: 0.3575, Entropy: 0.1674 +[2026-01-29T21:57:14.350205Z] Loop 1594: Loss: 3.66e-03, Avg Return: 0.441, Regret: 0.3575, Entropy: 0.1688 +[2026-01-29T21:57:15.554330Z] Loop 1595: Loss: 3.93e-03, Avg Return: 0.445, Regret: 0.3573, Entropy: 0.1697 +[2026-01-29T21:57:16.714452Z] Loop 1596: Loss: 3.48e-03, Avg Return: 0.446, Regret: 0.3573, Entropy: 0.1667 +[2026-01-29T21:57:17.879373Z] Loop 1597: Loss: 3.76e-03, Avg Return: 0.443, Regret: 0.3573, Entropy: 0.1622 +[2026-01-29T21:57:19.041315Z] Loop 1598: Loss: 3.67e-03, Avg Return: 0.449, Regret: 0.3573, Entropy: 0.1653 +[2026-01-29T21:57:20.201702Z] Loop 1599: Loss: 3.86e-03, Avg Return: 0.447, Regret: 0.3573, Entropy: 0.1644 +[2026-01-29T21:57:21.409350Z] Loop 1600: Loss: 3.74e-03, Avg Return: 0.446, Regret: 0.3573, Entropy: 0.1705 +[2026-01-29T21:57:22.570369Z] Loop 1601: Loss: 3.97e-03, Avg Return: 0.449, Regret: 0.3573, Entropy: 0.1659 +[2026-01-29T21:57:23.729315Z] Loop 1602: Loss: 4.31e-03, Avg Return: 0.443, Regret: 0.3573, Entropy: 0.1709 +[2026-01-29T21:57:24.888707Z] Loop 1603: Loss: 3.69e-03, Avg Return: 0.448, Regret: 0.3573, Entropy: 0.1726 +[2026-01-29T21:57:26.048839Z] Loop 1604: Loss: 4.71e-03, Avg Return: 0.447, Regret: 0.3573, Entropy: 0.1595 +[2026-01-29T21:57:27.251778Z] Loop 1605: Loss: 4.27e-03, Avg Return: 0.444, Regret: 0.3603, Entropy: 0.1548 +[2026-01-29T21:57:28.412030Z] Loop 1606: Loss: 4.64e-03, Avg Return: 0.442, Regret: 0.3603, Entropy: 0.1566 +[2026-01-29T21:57:29.572594Z] Loop 1607: Loss: 4.55e-03, Avg Return: 0.442, Regret: 0.3603, Entropy: 0.1563 +[2026-01-29T21:57:30.737119Z] Loop 1608: Loss: 4.61e-03, Avg Return: 0.445, Regret: 0.3603, Entropy: 0.1561 +[2026-01-29T21:57:31.895724Z] Loop 1609: Loss: 4.16e-03, Avg Return: 0.444, Regret: 0.3603, Entropy: 0.1594 +[2026-01-29T21:57:33.098861Z] Loop 1610: Loss: 4.39e-03, Avg Return: 0.439, Regret: 0.3592, Entropy: 0.1557 +[2026-01-29T21:57:34.258396Z] Loop 1611: Loss: 4.02e-03, Avg Return: 0.446, Regret: 0.3592, Entropy: 0.1602 +[2026-01-29T21:57:35.419354Z] Loop 1612: Loss: 4.01e-03, Avg Return: 0.444, Regret: 0.3592, Entropy: 0.1596 +[2026-01-29T21:57:36.578391Z] Loop 1613: Loss: 3.83e-03, Avg Return: 0.445, Regret: 0.3592, Entropy: 0.1611 +[2026-01-29T21:57:37.738701Z] Loop 1614: Loss: 3.05e-03, Avg Return: 0.442, Regret: 0.3592, Entropy: 0.1512 +[2026-01-29T21:57:38.941795Z] Loop 1615: Loss: 2.88e-03, Avg Return: 0.452, Regret: 0.3583, Entropy: 0.1431 +[2026-01-29T21:57:40.102210Z] Loop 1616: Loss: 2.54e-03, Avg Return: 0.440, Regret: 0.3583, Entropy: 0.1329 +[2026-01-29T21:57:41.261643Z] Loop 1617: Loss: 2.14e-03, Avg Return: 0.441, Regret: 0.3583, Entropy: 0.1312 +[2026-01-29T21:57:42.421985Z] Loop 1618: Loss: 2.50e-03, Avg Return: 0.441, Regret: 0.3583, Entropy: 0.1356 +[2026-01-29T21:57:43.581437Z] Loop 1619: Loss: 2.52e-03, Avg Return: 0.442, Regret: 0.3583, Entropy: 0.1335 +[2026-01-29T21:57:44.793666Z] Loop 1620: Loss: 2.05e-03, Avg Return: 0.447, Regret: 0.3602, Entropy: 0.1313 +[2026-01-29T21:57:45.952102Z] Loop 1621: Loss: 2.56e-03, Avg Return: 0.436, Regret: 0.3602, Entropy: 0.1353 +[2026-01-29T21:57:47.112535Z] Loop 1622: Loss: 2.32e-03, Avg Return: 0.446, Regret: 0.3602, Entropy: 0.1284 +[2026-01-29T21:57:48.271848Z] Loop 1623: Loss: 2.00e-03, Avg Return: 0.439, Regret: 0.3602, Entropy: 0.1346 +[2026-01-29T21:57:49.431232Z] Loop 1624: Loss: 2.36e-03, Avg Return: 0.446, Regret: 0.3602, Entropy: 0.1353 +[2026-01-29T21:57:50.634044Z] Loop 1625: Loss: 2.42e-03, Avg Return: 0.447, Regret: 0.3593, Entropy: 0.1331 +[2026-01-29T21:57:51.794244Z] Loop 1626: Loss: 2.95e-03, Avg Return: 0.447, Regret: 0.3593, Entropy: 0.1400 +[2026-01-29T21:57:52.954073Z] Loop 1627: Loss: 2.97e-03, Avg Return: 0.443, Regret: 0.3593, Entropy: 0.1404 +[2026-01-29T21:57:54.115245Z] Loop 1628: Loss: 2.98e-03, Avg Return: 0.450, Regret: 0.3593, Entropy: 0.1455 +[2026-01-29T21:57:55.274474Z] Loop 1629: Loss: 3.07e-03, Avg Return: 0.454, Regret: 0.3593, Entropy: 0.1422 +[2026-01-29T21:57:56.478431Z] Loop 1630: Loss: 2.89e-03, Avg Return: 0.446, Regret: 0.3582, Entropy: 0.1444 +[2026-01-29T21:57:57.640064Z] Loop 1631: Loss: 2.83e-03, Avg Return: 0.448, Regret: 0.3582, Entropy: 0.1426 +[2026-01-29T21:57:58.800409Z] Loop 1632: Loss: 2.82e-03, Avg Return: 0.447, Regret: 0.3582, Entropy: 0.1426 +[2026-01-29T21:57:59.960903Z] Loop 1633: Loss: 2.64e-03, Avg Return: 0.450, Regret: 0.3582, Entropy: 0.1428 +[2026-01-29T21:58:01.122098Z] Loop 1634: Loss: 2.80e-03, Avg Return: 0.449, Regret: 0.3582, Entropy: 0.1504 +[2026-01-29T21:58:02.326814Z] Loop 1635: Loss: 3.02e-03, Avg Return: 0.454, Regret: 0.3576, Entropy: 0.1460 +[2026-01-29T21:58:03.486850Z] Loop 1636: Loss: 3.21e-03, Avg Return: 0.444, Regret: 0.3576, Entropy: 0.1545 +[2026-01-29T21:58:04.646131Z] Loop 1637: Loss: 3.60e-03, Avg Return: 0.446, Regret: 0.3576, Entropy: 0.1594 +[2026-01-29T21:58:05.806262Z] Loop 1638: Loss: 3.48e-03, Avg Return: 0.452, Regret: 0.3576, Entropy: 0.1593 +[2026-01-29T21:58:06.966330Z] Loop 1639: Loss: 3.43e-03, Avg Return: 0.452, Regret: 0.3576, Entropy: 0.1601 +[2026-01-29T21:58:08.170161Z] Loop 1640: Loss: 3.70e-03, Avg Return: 0.450, Regret: 0.3568, Entropy: 0.1710 +[2026-01-29T21:58:09.330661Z] Loop 1641: Loss: 4.34e-03, Avg Return: 0.454, Regret: 0.3568, Entropy: 0.1611 +[2026-01-29T21:58:10.491035Z] Loop 1642: Loss: 4.20e-03, Avg Return: 0.450, Regret: 0.3568, Entropy: 0.1656 +[2026-01-29T21:58:11.650642Z] Loop 1643: Loss: 3.87e-03, Avg Return: 0.442, Regret: 0.3568, Entropy: 0.1688 +[2026-01-29T21:58:12.810449Z] Loop 1644: Loss: 4.03e-03, Avg Return: 0.453, Regret: 0.3568, Entropy: 0.1655 +[2026-01-29T21:58:14.020646Z] Loop 1645: Loss: 3.80e-03, Avg Return: 0.444, Regret: 0.3568, Entropy: 0.1679 +[2026-01-29T21:58:15.185362Z] Loop 1646: Loss: 4.45e-03, Avg Return: 0.451, Regret: 0.3568, Entropy: 0.1628 +[2026-01-29T21:58:16.345130Z] Loop 1647: Loss: 4.13e-03, Avg Return: 0.446, Regret: 0.3568, Entropy: 0.1695 +[2026-01-29T21:58:17.505210Z] Loop 1648: Loss: 3.53e-03, Avg Return: 0.451, Regret: 0.3568, Entropy: 0.1706 +[2026-01-29T21:58:18.666378Z] Loop 1649: Loss: 3.88e-03, Avg Return: 0.445, Regret: 0.3568, Entropy: 0.1634 +[2026-01-29T21:58:19.871775Z] Loop 1650: Loss: 3.22e-03, Avg Return: 0.444, Regret: 0.3568, Entropy: 0.1553 +[2026-01-29T21:58:21.034245Z] Loop 1651: Loss: 2.59e-03, Avg Return: 0.447, Regret: 0.3568, Entropy: 0.1375 +[2026-01-29T21:58:22.194426Z] Loop 1652: Loss: 2.89e-03, Avg Return: 0.445, Regret: 0.3568, Entropy: 0.1438 +[2026-01-29T21:58:23.355290Z] Loop 1653: Loss: 3.46e-03, Avg Return: 0.445, Regret: 0.3568, Entropy: 0.1569 +[2026-01-29T21:58:24.514386Z] Loop 1654: Loss: 3.40e-03, Avg Return: 0.437, Regret: 0.3568, Entropy: 0.1503 +[2026-01-29T21:58:25.721147Z] Loop 1655: Loss: 3.34e-03, Avg Return: 0.445, Regret: 0.3619, Entropy: 0.1456 +[2026-01-29T21:58:26.888204Z] Loop 1656: Loss: 3.22e-03, Avg Return: 0.438, Regret: 0.3619, Entropy: 0.1510 +[2026-01-29T21:58:28.048952Z] Loop 1657: Loss: 3.30e-03, Avg Return: 0.442, Regret: 0.3619, Entropy: 0.1458 +[2026-01-29T21:58:29.209985Z] Loop 1658: Loss: 2.83e-03, Avg Return: 0.446, Regret: 0.3619, Entropy: 0.1366 +[2026-01-29T21:58:30.371734Z] Loop 1659: Loss: 2.54e-03, Avg Return: 0.447, Regret: 0.3619, Entropy: 0.1387 +[2026-01-29T21:58:31.577426Z] Loop 1660: Loss: 2.43e-03, Avg Return: 0.443, Regret: 0.3574, Entropy: 0.1405 +[2026-01-29T21:58:32.738161Z] Loop 1661: Loss: 2.94e-03, Avg Return: 0.452, Regret: 0.3574, Entropy: 0.1506 +[2026-01-29T21:58:33.897786Z] Loop 1662: Loss: 3.66e-03, Avg Return: 0.454, Regret: 0.3574, Entropy: 0.1608 +[2026-01-29T21:58:35.059771Z] Loop 1663: Loss: 3.42e-03, Avg Return: 0.445, Regret: 0.3574, Entropy: 0.1707 +[2026-01-29T21:58:36.220513Z] Loop 1664: Loss: 4.29e-03, Avg Return: 0.452, Regret: 0.3574, Entropy: 0.1750 +[2026-01-29T21:58:37.426637Z] Loop 1665: Loss: 4.71e-03, Avg Return: 0.448, Regret: 0.3563, Entropy: 0.1711 +[2026-01-29T21:58:38.586510Z] Loop 1666: Loss: 4.23e-03, Avg Return: 0.445, Regret: 0.3563, Entropy: 0.1670 +[2026-01-29T21:58:39.746524Z] Loop 1667: Loss: 4.04e-03, Avg Return: 0.446, Regret: 0.3563, Entropy: 0.1597 +[2026-01-29T21:58:40.906174Z] Loop 1668: Loss: 4.33e-03, Avg Return: 0.453, Regret: 0.3563, Entropy: 0.1589 +[2026-01-29T21:58:42.065980Z] Loop 1669: Loss: 4.62e-03, Avg Return: 0.455, Regret: 0.3563, Entropy: 0.1575 +[2026-01-29T21:58:43.270350Z] Loop 1670: Loss: 4.66e-03, Avg Return: 0.444, Regret: 0.3564, Entropy: 0.1572 +[2026-01-29T21:58:44.432144Z] Loop 1671: Loss: 3.93e-03, Avg Return: 0.448, Regret: 0.3564, Entropy: 0.1588 +[2026-01-29T21:58:45.591241Z] Loop 1672: Loss: 3.90e-03, Avg Return: 0.448, Regret: 0.3564, Entropy: 0.1553 +[2026-01-29T21:58:46.750962Z] Loop 1673: Loss: 4.19e-03, Avg Return: 0.450, Regret: 0.3564, Entropy: 0.1639 +[2026-01-29T21:58:47.912196Z] Loop 1674: Loss: 4.37e-03, Avg Return: 0.446, Regret: 0.3564, Entropy: 0.1634 +[2026-01-29T21:58:49.116179Z] Loop 1675: Loss: 4.28e-03, Avg Return: 0.447, Regret: 0.3564, Entropy: 0.1565 +[2026-01-29T21:58:50.275442Z] Loop 1676: Loss: 3.73e-03, Avg Return: 0.446, Regret: 0.3564, Entropy: 0.1516 +[2026-01-29T21:58:51.435465Z] Loop 1677: Loss: 4.16e-03, Avg Return: 0.448, Regret: 0.3564, Entropy: 0.1532 +[2026-01-29T21:58:52.594503Z] Loop 1678: Loss: 4.73e-03, Avg Return: 0.447, Regret: 0.3564, Entropy: 0.1554 +[2026-01-29T21:58:53.754165Z] Loop 1679: Loss: 4.26e-03, Avg Return: 0.451, Regret: 0.3564, Entropy: 0.1535 +[2026-01-29T21:58:54.958447Z] Loop 1680: Loss: 3.91e-03, Avg Return: 0.443, Regret: 0.3565, Entropy: 0.1529 +[2026-01-29T21:58:56.119390Z] Loop 1681: Loss: 4.47e-03, Avg Return: 0.455, Regret: 0.3565, Entropy: 0.1557 +[2026-01-29T21:58:57.279266Z] Loop 1682: Loss: 4.14e-03, Avg Return: 0.446, Regret: 0.3565, Entropy: 0.1498 +[2026-01-29T21:58:58.439456Z] Loop 1683: Loss: 4.48e-03, Avg Return: 0.449, Regret: 0.3565, Entropy: 0.1458 +[2026-01-29T21:58:59.600949Z] Loop 1684: Loss: 4.46e-03, Avg Return: 0.449, Regret: 0.3565, Entropy: 0.1441 +[2026-01-29T21:59:00.806846Z] Loop 1685: Loss: 4.45e-03, Avg Return: 0.447, Regret: 0.3568, Entropy: 0.1516 +[2026-01-29T21:59:01.969311Z] Loop 1686: Loss: 5.06e-03, Avg Return: 0.435, Regret: 0.3568, Entropy: 0.1539 +[2026-01-29T21:59:03.130007Z] Loop 1687: Loss: 5.23e-03, Avg Return: 0.447, Regret: 0.3568, Entropy: 0.1564 +[2026-01-29T21:59:04.291838Z] Loop 1688: Loss: 4.83e-03, Avg Return: 0.443, Regret: 0.3568, Entropy: 0.1487 +[2026-01-29T21:59:05.452622Z] Loop 1689: Loss: 4.66e-03, Avg Return: 0.429, Regret: 0.3568, Entropy: 0.1525 +[2026-01-29T21:59:06.658611Z] Loop 1690: Loss: 4.84e-03, Avg Return: 0.439, Regret: 0.3639, Entropy: 0.1465 +[2026-01-29T21:59:07.821633Z] Loop 1691: Loss: 4.94e-03, Avg Return: 0.444, Regret: 0.3639, Entropy: 0.1488 +[2026-01-29T21:59:08.983170Z] Loop 1692: Loss: 4.67e-03, Avg Return: 0.442, Regret: 0.3639, Entropy: 0.1491 +[2026-01-29T21:59:10.143223Z] Loop 1693: Loss: 4.72e-03, Avg Return: 0.443, Regret: 0.3639, Entropy: 0.1568 +[2026-01-29T21:59:11.304371Z] Loop 1694: Loss: 4.79e-03, Avg Return: 0.451, Regret: 0.3639, Entropy: 0.1551 +[2026-01-29T21:59:12.511472Z] Loop 1695: Loss: 4.54e-03, Avg Return: 0.450, Regret: 0.3560, Entropy: 0.1477 +[2026-01-29T21:59:13.672613Z] Loop 1696: Loss: 3.94e-03, Avg Return: 0.442, Regret: 0.3560, Entropy: 0.1588 +[2026-01-29T21:59:14.832544Z] Loop 1697: Loss: 3.90e-03, Avg Return: 0.444, Regret: 0.3560, Entropy: 0.1626 +[2026-01-29T21:59:15.992450Z] Loop 1698: Loss: 3.58e-03, Avg Return: 0.445, Regret: 0.3560, Entropy: 0.1600 +[2026-01-29T21:59:17.153326Z] Loop 1699: Loss: 3.68e-03, Avg Return: 0.451, Regret: 0.3560, Entropy: 0.1484 +[2026-01-29T21:59:18.361385Z] Loop 1700: Loss: 3.39e-03, Avg Return: 0.442, Regret: 0.3562, Entropy: 0.1595 +[2026-01-29T21:59:19.521823Z] Loop 1701: Loss: 3.41e-03, Avg Return: 0.444, Regret: 0.3562, Entropy: 0.1553 +[2026-01-29T21:59:20.681643Z] Loop 1702: Loss: 3.06e-03, Avg Return: 0.437, Regret: 0.3562, Entropy: 0.1495 +[2026-01-29T21:59:21.841428Z] Loop 1703: Loss: 2.92e-03, Avg Return: 0.446, Regret: 0.3562, Entropy: 0.1397 +[2026-01-29T21:59:23.003370Z] Loop 1704: Loss: 2.75e-03, Avg Return: 0.446, Regret: 0.3562, Entropy: 0.1424 +[2026-01-29T21:59:24.209305Z] Loop 1705: Loss: 2.68e-03, Avg Return: 0.447, Regret: 0.3571, Entropy: 0.1418 +[2026-01-29T21:59:25.371243Z] Loop 1706: Loss: 2.26e-03, Avg Return: 0.451, Regret: 0.3571, Entropy: 0.1376 +[2026-01-29T21:59:26.530674Z] Loop 1707: Loss: 2.45e-03, Avg Return: 0.448, Regret: 0.3571, Entropy: 0.1314 +[2026-01-29T21:59:27.691172Z] Loop 1708: Loss: 2.35e-03, Avg Return: 0.451, Regret: 0.3571, Entropy: 0.1310 +[2026-01-29T21:59:28.852885Z] Loop 1709: Loss: 2.42e-03, Avg Return: 0.449, Regret: 0.3571, Entropy: 0.1283 +[2026-01-29T21:59:30.055789Z] Loop 1710: Loss: 2.18e-03, Avg Return: 0.453, Regret: 0.3578, Entropy: 0.1282 +[2026-01-29T21:59:31.214959Z] Loop 1711: Loss: 2.17e-03, Avg Return: 0.452, Regret: 0.3578, Entropy: 0.1262 +[2026-01-29T21:59:32.375713Z] Loop 1712: Loss: 2.24e-03, Avg Return: 0.442, Regret: 0.3578, Entropy: 0.1335 +[2026-01-29T21:59:33.535930Z] Loop 1713: Loss: 2.12e-03, Avg Return: 0.447, Regret: 0.3578, Entropy: 0.1251 +[2026-01-29T21:59:34.695553Z] Loop 1714: Loss: 1.95e-03, Avg Return: 0.445, Regret: 0.3578, Entropy: 0.1326 +[2026-01-29T21:59:35.900335Z] Loop 1715: Loss: 2.08e-03, Avg Return: 0.443, Regret: 0.3572, Entropy: 0.1324 +[2026-01-29T21:59:37.062028Z] Loop 1716: Loss: 2.35e-03, Avg Return: 0.450, Regret: 0.3572, Entropy: 0.1344 +[2026-01-29T21:59:38.222640Z] Loop 1717: Loss: 2.41e-03, Avg Return: 0.443, Regret: 0.3572, Entropy: 0.1388 +[2026-01-29T21:59:39.383027Z] Loop 1718: Loss: 2.50e-03, Avg Return: 0.445, Regret: 0.3572, Entropy: 0.1425 +[2026-01-29T21:59:40.550344Z] Loop 1719: Loss: 2.48e-03, Avg Return: 0.449, Regret: 0.3572, Entropy: 0.1465 +[2026-01-29T21:59:41.759989Z] Loop 1720: Loss: 2.54e-03, Avg Return: 0.447, Regret: 0.3562, Entropy: 0.1411 +[2026-01-29T21:59:42.922422Z] Loop 1721: Loss: 2.83e-03, Avg Return: 0.449, Regret: 0.3562, Entropy: 0.1455 +[2026-01-29T21:59:44.086325Z] Loop 1722: Loss: 2.48e-03, Avg Return: 0.447, Regret: 0.3562, Entropy: 0.1461 +[2026-01-29T21:59:45.247438Z] Loop 1723: Loss: 2.43e-03, Avg Return: 0.447, Regret: 0.3562, Entropy: 0.1299 +[2026-01-29T21:59:46.408098Z] Loop 1724: Loss: 2.30e-03, Avg Return: 0.452, Regret: 0.3562, Entropy: 0.1353 +[2026-01-29T21:59:47.612752Z] Loop 1725: Loss: 2.10e-03, Avg Return: 0.447, Regret: 0.3568, Entropy: 0.1341 +[2026-01-29T21:59:48.776543Z] Loop 1726: Loss: 2.33e-03, Avg Return: 0.451, Regret: 0.3568, Entropy: 0.1342 +[2026-01-29T21:59:49.936434Z] Loop 1727: Loss: 2.43e-03, Avg Return: 0.446, Regret: 0.3568, Entropy: 0.1434 +[2026-01-29T21:59:51.094759Z] Loop 1728: Loss: 2.08e-03, Avg Return: 0.447, Regret: 0.3568, Entropy: 0.1440 +[2026-01-29T21:59:52.254068Z] Loop 1729: Loss: 2.59e-03, Avg Return: 0.446, Regret: 0.3568, Entropy: 0.1398 +[2026-01-29T21:59:53.461137Z] Loop 1730: Loss: 2.48e-03, Avg Return: 0.447, Regret: 0.3558, Entropy: 0.1349 +[2026-01-29T21:59:54.620474Z] Loop 1731: Loss: 2.43e-03, Avg Return: 0.439, Regret: 0.3558, Entropy: 0.1516 +[2026-01-29T21:59:55.779619Z] Loop 1732: Loss: 3.22e-03, Avg Return: 0.451, Regret: 0.3558, Entropy: 0.1506 +[2026-01-29T21:59:56.939587Z] Loop 1733: Loss: 2.96e-03, Avg Return: 0.444, Regret: 0.3558, Entropy: 0.1510 +[2026-01-29T21:59:58.099885Z] Loop 1734: Loss: 2.72e-03, Avg Return: 0.445, Regret: 0.3558, Entropy: 0.1490 +[2026-01-29T21:59:59.303316Z] Loop 1735: Loss: 2.67e-03, Avg Return: 0.449, Regret: 0.3552, Entropy: 0.1469 +[2026-01-29T22:00:00.462561Z] Loop 1736: Loss: 2.56e-03, Avg Return: 0.455, Regret: 0.3552, Entropy: 0.1466 +[2026-01-29T22:00:01.622094Z] Loop 1737: Loss: 2.39e-03, Avg Return: 0.446, Regret: 0.3552, Entropy: 0.1439 +[2026-01-29T22:00:02.781080Z] Loop 1738: Loss: 2.50e-03, Avg Return: 0.444, Regret: 0.3552, Entropy: 0.1568 +[2026-01-29T22:00:03.941157Z] Loop 1739: Loss: 2.70e-03, Avg Return: 0.455, Regret: 0.3552, Entropy: 0.1487 +[2026-01-29T22:00:05.145121Z] Loop 1740: Loss: 3.13e-03, Avg Return: 0.450, Regret: 0.3545, Entropy: 0.1599 +[2026-01-29T22:00:06.305205Z] Loop 1741: Loss: 2.94e-03, Avg Return: 0.447, Regret: 0.3545, Entropy: 0.1612 +[2026-01-29T22:00:07.464431Z] Loop 1742: Loss: 3.72e-03, Avg Return: 0.441, Regret: 0.3545, Entropy: 0.1698 +[2026-01-29T22:00:08.624204Z] Loop 1743: Loss: 3.69e-03, Avg Return: 0.447, Regret: 0.3545, Entropy: 0.1722 +[2026-01-29T22:00:09.785176Z] Loop 1744: Loss: 3.82e-03, Avg Return: 0.447, Regret: 0.3545, Entropy: 0.1749 +[2026-01-29T22:00:10.988366Z] Loop 1745: Loss: 4.00e-03, Avg Return: 0.456, Regret: 0.3541, Entropy: 0.1765 +[2026-01-29T22:00:12.147054Z] Loop 1746: Loss: 4.77e-03, Avg Return: 0.452, Regret: 0.3541, Entropy: 0.1911 +[2026-01-29T22:00:13.308125Z] Loop 1747: Loss: 4.83e-03, Avg Return: 0.449, Regret: 0.3541, Entropy: 0.2051 +[2026-01-29T22:00:14.468699Z] Loop 1748: Loss: 5.65e-03, Avg Return: 0.448, Regret: 0.3541, Entropy: 0.2092 +[2026-01-29T22:00:15.628995Z] Loop 1749: Loss: 5.98e-03, Avg Return: 0.456, Regret: 0.3541, Entropy: 0.2240 +[2026-01-29T22:00:16.834344Z] Loop 1750: Loss: 6.09e-03, Avg Return: 0.441, Regret: 0.3644, Entropy: 0.2284 +[2026-01-29T22:00:17.994339Z] Loop 1751: Loss: 6.45e-03, Avg Return: 0.439, Regret: 0.3644, Entropy: 0.2269 +[2026-01-29T22:00:19.153891Z] Loop 1752: Loss: 6.51e-03, Avg Return: 0.446, Regret: 0.3644, Entropy: 0.2165 +[2026-01-29T22:00:20.313855Z] Loop 1753: Loss: 5.69e-03, Avg Return: 0.446, Regret: 0.3644, Entropy: 0.2156 +[2026-01-29T22:00:21.475425Z] Loop 1754: Loss: 5.33e-03, Avg Return: 0.446, Regret: 0.3644, Entropy: 0.2088 +[2026-01-29T22:00:22.679585Z] Loop 1755: Loss: 4.60e-03, Avg Return: 0.455, Regret: 0.3544, Entropy: 0.1874 +[2026-01-29T22:00:23.840528Z] Loop 1756: Loss: 3.51e-03, Avg Return: 0.442, Regret: 0.3544, Entropy: 0.1774 +[2026-01-29T22:00:25.001849Z] Loop 1757: Loss: 3.27e-03, Avg Return: 0.449, Regret: 0.3544, Entropy: 0.1593 +[2026-01-29T22:00:26.164904Z] Loop 1758: Loss: 2.77e-03, Avg Return: 0.445, Regret: 0.3544, Entropy: 0.1541 +[2026-01-29T22:00:27.325087Z] Loop 1759: Loss: 2.50e-03, Avg Return: 0.450, Regret: 0.3544, Entropy: 0.1504 +[2026-01-29T22:00:28.531166Z] Loop 1760: Loss: 2.66e-03, Avg Return: 0.443, Regret: 0.3557, Entropy: 0.1431 +[2026-01-29T22:00:29.691820Z] Loop 1761: Loss: 2.50e-03, Avg Return: 0.446, Regret: 0.3557, Entropy: 0.1492 +[2026-01-29T22:00:30.853944Z] Loop 1762: Loss: 2.60e-03, Avg Return: 0.447, Regret: 0.3557, Entropy: 0.1407 +[2026-01-29T22:00:32.015299Z] Loop 1763: Loss: 2.68e-03, Avg Return: 0.441, Regret: 0.3557, Entropy: 0.1473 +[2026-01-29T22:00:33.177354Z] Loop 1764: Loss: 3.15e-03, Avg Return: 0.449, Regret: 0.3557, Entropy: 0.1431 +[2026-01-29T22:00:34.381876Z] Loop 1765: Loss: 2.96e-03, Avg Return: 0.450, Regret: 0.3571, Entropy: 0.1468 +[2026-01-29T22:00:35.543728Z] Loop 1766: Loss: 2.87e-03, Avg Return: 0.453, Regret: 0.3571, Entropy: 0.1462 +[2026-01-29T22:00:36.707756Z] Loop 1767: Loss: 2.74e-03, Avg Return: 0.446, Regret: 0.3571, Entropy: 0.1404 +[2026-01-29T22:00:37.869025Z] Loop 1768: Loss: 2.49e-03, Avg Return: 0.449, Regret: 0.3571, Entropy: 0.1444 +[2026-01-29T22:00:39.028475Z] Loop 1769: Loss: 2.76e-03, Avg Return: 0.450, Regret: 0.3571, Entropy: 0.1560 +[2026-01-29T22:00:40.232637Z] Loop 1770: Loss: 4.06e-03, Avg Return: 0.453, Regret: 0.3538, Entropy: 0.1716 +[2026-01-29T22:00:41.394941Z] Loop 1771: Loss: 4.47e-03, Avg Return: 0.453, Regret: 0.3538, Entropy: 0.1772 +[2026-01-29T22:00:42.556329Z] Loop 1772: Loss: 4.92e-03, Avg Return: 0.447, Regret: 0.3538, Entropy: 0.1811 +[2026-01-29T22:00:43.716060Z] Loop 1773: Loss: 5.41e-03, Avg Return: 0.455, Regret: 0.3538, Entropy: 0.1787 +[2026-01-29T22:00:44.875686Z] Loop 1774: Loss: 4.97e-03, Avg Return: 0.452, Regret: 0.3538, Entropy: 0.1684 +[2026-01-29T22:00:46.084446Z] Loop 1775: Loss: 4.86e-03, Avg Return: 0.446, Regret: 0.3557, Entropy: 0.1678 +[2026-01-29T22:00:47.245181Z] Loop 1776: Loss: 5.11e-03, Avg Return: 0.448, Regret: 0.3557, Entropy: 0.1648 +[2026-01-29T22:00:48.404606Z] Loop 1777: Loss: 4.88e-03, Avg Return: 0.457, Regret: 0.3557, Entropy: 0.1705 +[2026-01-29T22:00:49.565163Z] Loop 1778: Loss: 4.60e-03, Avg Return: 0.448, Regret: 0.3557, Entropy: 0.1673 +[2026-01-29T22:00:50.726342Z] Loop 1779: Loss: 3.62e-03, Avg Return: 0.455, Regret: 0.3557, Entropy: 0.1678 +[2026-01-29T22:00:51.930096Z] Loop 1780: Loss: 3.30e-03, Avg Return: 0.450, Regret: 0.3544, Entropy: 0.1461 +[2026-01-29T22:00:53.088839Z] Loop 1781: Loss: 2.45e-03, Avg Return: 0.448, Regret: 0.3544, Entropy: 0.1393 +[2026-01-29T22:00:54.248709Z] Loop 1782: Loss: 2.13e-03, Avg Return: 0.451, Regret: 0.3544, Entropy: 0.1313 +[2026-01-29T22:00:55.409165Z] Loop 1783: Loss: 1.91e-03, Avg Return: 0.445, Regret: 0.3544, Entropy: 0.1313 +[2026-01-29T22:00:56.569199Z] Loop 1784: Loss: 1.90e-03, Avg Return: 0.450, Regret: 0.3544, Entropy: 0.1271 +[2026-01-29T22:00:57.775160Z] Loop 1785: Loss: 2.14e-03, Avg Return: 0.443, Regret: 0.3578, Entropy: 0.1283 +[2026-01-29T22:00:58.935825Z] Loop 1786: Loss: 2.03e-03, Avg Return: 0.437, Regret: 0.3578, Entropy: 0.1333 +[2026-01-29T22:01:00.094785Z] Loop 1787: Loss: 2.82e-03, Avg Return: 0.450, Regret: 0.3578, Entropy: 0.1349 +[2026-01-29T22:01:01.254794Z] Loop 1788: Loss: 2.26e-03, Avg Return: 0.448, Regret: 0.3578, Entropy: 0.1298 +[2026-01-29T22:01:02.415831Z] Loop 1789: Loss: 1.95e-03, Avg Return: 0.440, Regret: 0.3578, Entropy: 0.1305 +[2026-01-29T22:01:03.619473Z] Loop 1790: Loss: 2.06e-03, Avg Return: 0.454, Regret: 0.3570, Entropy: 0.1257 +[2026-01-29T22:01:04.778766Z] Loop 1791: Loss: 1.94e-03, Avg Return: 0.445, Regret: 0.3570, Entropy: 0.1318 +[2026-01-29T22:01:05.938486Z] Loop 1792: Loss: 2.21e-03, Avg Return: 0.447, Regret: 0.3570, Entropy: 0.1234 +[2026-01-29T22:01:07.097563Z] Loop 1793: Loss: 1.96e-03, Avg Return: 0.447, Regret: 0.3570, Entropy: 0.1259 +[2026-01-29T22:01:08.260251Z] Loop 1794: Loss: 2.17e-03, Avg Return: 0.455, Regret: 0.3570, Entropy: 0.1332 +[2026-01-29T22:01:09.464696Z] Loop 1795: Loss: 2.13e-03, Avg Return: 0.445, Regret: 0.3548, Entropy: 0.1427 +[2026-01-29T22:01:10.627752Z] Loop 1796: Loss: 2.45e-03, Avg Return: 0.448, Regret: 0.3548, Entropy: 0.1416 +[2026-01-29T22:01:11.788317Z] Loop 1797: Loss: 2.02e-03, Avg Return: 0.452, Regret: 0.3548, Entropy: 0.1316 +[2026-01-29T22:01:12.949364Z] Loop 1798: Loss: 2.09e-03, Avg Return: 0.449, Regret: 0.3548, Entropy: 0.1380 +[2026-01-29T22:01:14.111564Z] Loop 1799: Loss: 2.12e-03, Avg Return: 0.459, Regret: 0.3548, Entropy: 0.1319 +[2026-01-29T22:01:15.318538Z] Loop 1800: Loss: 2.28e-03, Avg Return: 0.450, Regret: 0.3548, Entropy: 0.1324 +[2026-01-29T22:01:16.479997Z] Loop 1801: Loss: 2.06e-03, Avg Return: 0.453, Regret: 0.3548, Entropy: 0.1340 +[2026-01-29T22:01:17.640012Z] Loop 1802: Loss: 2.01e-03, Avg Return: 0.450, Regret: 0.3548, Entropy: 0.1385 +[2026-01-29T22:01:18.801775Z] Loop 1803: Loss: 2.43e-03, Avg Return: 0.453, Regret: 0.3548, Entropy: 0.1398 +[2026-01-29T22:01:19.962781Z] Loop 1804: Loss: 2.46e-03, Avg Return: 0.452, Regret: 0.3548, Entropy: 0.1402 +[2026-01-29T22:01:21.167711Z] Loop 1805: Loss: 2.93e-03, Avg Return: 0.453, Regret: 0.3537, Entropy: 0.1540 +[2026-01-29T22:01:22.328278Z] Loop 1806: Loss: 2.95e-03, Avg Return: 0.444, Regret: 0.3537, Entropy: 0.1573 +[2026-01-29T22:01:23.488085Z] Loop 1807: Loss: 3.55e-03, Avg Return: 0.454, Regret: 0.3537, Entropy: 0.1595 +[2026-01-29T22:01:24.647193Z] Loop 1808: Loss: 4.14e-03, Avg Return: 0.451, Regret: 0.3537, Entropy: 0.1710 +[2026-01-29T22:01:25.806980Z] Loop 1809: Loss: 5.04e-03, Avg Return: 0.446, Regret: 0.3537, Entropy: 0.1741 +[2026-01-29T22:01:27.009175Z] Loop 1810: Loss: 5.03e-03, Avg Return: 0.446, Regret: 0.3552, Entropy: 0.1652 +[2026-01-29T22:01:28.169757Z] Loop 1811: Loss: 5.33e-03, Avg Return: 0.458, Regret: 0.3552, Entropy: 0.1629 +[2026-01-29T22:01:29.330308Z] Loop 1812: Loss: 5.62e-03, Avg Return: 0.448, Regret: 0.3552, Entropy: 0.1669 +[2026-01-29T22:01:30.491368Z] Loop 1813: Loss: 5.08e-03, Avg Return: 0.451, Regret: 0.3552, Entropy: 0.1585 +[2026-01-29T22:01:31.651963Z] Loop 1814: Loss: 4.70e-03, Avg Return: 0.452, Regret: 0.3552, Entropy: 0.1604 +[2026-01-29T22:01:32.857480Z] Loop 1815: Loss: 4.71e-03, Avg Return: 0.459, Regret: 0.3534, Entropy: 0.1596 +[2026-01-29T22:01:34.017802Z] Loop 1816: Loss: 4.53e-03, Avg Return: 0.450, Regret: 0.3534, Entropy: 0.1535 +[2026-01-29T22:01:35.182442Z] Loop 1817: Loss: 4.26e-03, Avg Return: 0.452, Regret: 0.3534, Entropy: 0.1512 +[2026-01-29T22:01:36.341260Z] Loop 1818: Loss: 4.42e-03, Avg Return: 0.457, Regret: 0.3534, Entropy: 0.1500 +[2026-01-29T22:01:37.500905Z] Loop 1819: Loss: 4.65e-03, Avg Return: 0.448, Regret: 0.3534, Entropy: 0.1539 +[2026-01-29T22:01:38.707441Z] Loop 1820: Loss: 4.23e-03, Avg Return: 0.456, Regret: 0.3535, Entropy: 0.1464 +[2026-01-29T22:01:39.868047Z] Loop 1821: Loss: 3.49e-03, Avg Return: 0.449, Regret: 0.3535, Entropy: 0.1487 +[2026-01-29T22:01:41.028032Z] Loop 1822: Loss: 3.39e-03, Avg Return: 0.447, Regret: 0.3535, Entropy: 0.1522 +[2026-01-29T22:01:42.188307Z] Loop 1823: Loss: 3.46e-03, Avg Return: 0.450, Regret: 0.3535, Entropy: 0.1479 +[2026-01-29T22:01:43.349794Z] Loop 1824: Loss: 3.06e-03, Avg Return: 0.452, Regret: 0.3535, Entropy: 0.1487 +[2026-01-29T22:01:44.553474Z] Loop 1825: Loss: 3.20e-03, Avg Return: 0.452, Regret: 0.3541, Entropy: 0.1401 +[2026-01-29T22:01:45.712775Z] Loop 1826: Loss: 3.83e-03, Avg Return: 0.453, Regret: 0.3541, Entropy: 0.1525 +[2026-01-29T22:01:46.872448Z] Loop 1827: Loss: 4.05e-03, Avg Return: 0.449, Regret: 0.3541, Entropy: 0.1448 +[2026-01-29T22:01:48.032914Z] Loop 1828: Loss: 3.51e-03, Avg Return: 0.452, Regret: 0.3541, Entropy: 0.1512 +[2026-01-29T22:01:49.192245Z] Loop 1829: Loss: 4.19e-03, Avg Return: 0.442, Regret: 0.3541, Entropy: 0.1492 +[2026-01-29T22:01:50.394549Z] Loop 1830: Loss: 4.07e-03, Avg Return: 0.446, Regret: 0.3536, Entropy: 0.1451 +[2026-01-29T22:01:51.556461Z] Loop 1831: Loss: 4.35e-03, Avg Return: 0.452, Regret: 0.3536, Entropy: 0.1521 +[2026-01-29T22:01:52.715278Z] Loop 1832: Loss: 4.37e-03, Avg Return: 0.454, Regret: 0.3536, Entropy: 0.1416 +[2026-01-29T22:01:53.874768Z] Loop 1833: Loss: 4.44e-03, Avg Return: 0.449, Regret: 0.3536, Entropy: 0.1443 +[2026-01-29T22:01:55.035918Z] Loop 1834: Loss: 4.51e-03, Avg Return: 0.450, Regret: 0.3536, Entropy: 0.1517 +[2026-01-29T22:01:56.242811Z] Loop 1835: Loss: 4.23e-03, Avg Return: 0.451, Regret: 0.3533, Entropy: 0.1457 +[2026-01-29T22:01:57.404271Z] Loop 1836: Loss: 4.03e-03, Avg Return: 0.457, Regret: 0.3533, Entropy: 0.1480 +[2026-01-29T22:01:58.564042Z] Loop 1837: Loss: 4.78e-03, Avg Return: 0.451, Regret: 0.3533, Entropy: 0.1491 +[2026-01-29T22:01:59.726191Z] Loop 1838: Loss: 3.99e-03, Avg Return: 0.448, Regret: 0.3533, Entropy: 0.1495 +[2026-01-29T22:02:00.887501Z] Loop 1839: Loss: 3.92e-03, Avg Return: 0.445, Regret: 0.3533, Entropy: 0.1435 +[2026-01-29T22:02:02.095986Z] Loop 1840: Loss: 3.99e-03, Avg Return: 0.452, Regret: 0.3533, Entropy: 0.1492 +[2026-01-29T22:02:03.256072Z] Loop 1841: Loss: 3.80e-03, Avg Return: 0.450, Regret: 0.3533, Entropy: 0.1509 +[2026-01-29T22:02:04.417340Z] Loop 1842: Loss: 3.68e-03, Avg Return: 0.452, Regret: 0.3533, Entropy: 0.1538 +[2026-01-29T22:02:05.577592Z] Loop 1843: Loss: 3.62e-03, Avg Return: 0.448, Regret: 0.3533, Entropy: 0.1483 +[2026-01-29T22:02:06.737640Z] Loop 1844: Loss: 2.82e-03, Avg Return: 0.452, Regret: 0.3533, Entropy: 0.1427 +[2026-01-29T22:02:07.940922Z] Loop 1845: Loss: 2.52e-03, Avg Return: 0.448, Regret: 0.3542, Entropy: 0.1443 +[2026-01-29T22:02:09.101370Z] Loop 1846: Loss: 2.48e-03, Avg Return: 0.452, Regret: 0.3542, Entropy: 0.1436 +[2026-01-29T22:02:10.260481Z] Loop 1847: Loss: 2.49e-03, Avg Return: 0.452, Regret: 0.3542, Entropy: 0.1344 +[2026-01-29T22:02:11.420330Z] Loop 1848: Loss: 2.01e-03, Avg Return: 0.452, Regret: 0.3542, Entropy: 0.1444 +[2026-01-29T22:02:12.579552Z] Loop 1849: Loss: 2.27e-03, Avg Return: 0.460, Regret: 0.3542, Entropy: 0.1436 +[2026-01-29T22:02:13.782404Z] Loop 1850: Loss: 2.48e-03, Avg Return: 0.447, Regret: 0.3543, Entropy: 0.1463 +[2026-01-29T22:02:14.943403Z] Loop 1851: Loss: 2.55e-03, Avg Return: 0.445, Regret: 0.3543, Entropy: 0.1423 +[2026-01-29T22:02:16.104095Z] Loop 1852: Loss: 2.98e-03, Avg Return: 0.456, Regret: 0.3543, Entropy: 0.1389 +[2026-01-29T22:02:17.263911Z] Loop 1853: Loss: 3.08e-03, Avg Return: 0.453, Regret: 0.3543, Entropy: 0.1425 +[2026-01-29T22:02:18.423407Z] Loop 1854: Loss: 3.67e-03, Avg Return: 0.451, Regret: 0.3543, Entropy: 0.1514 +[2026-01-29T22:02:19.626637Z] Loop 1855: Loss: 3.74e-03, Avg Return: 0.451, Regret: 0.3530, Entropy: 0.1447 +[2026-01-29T22:02:20.789234Z] Loop 1856: Loss: 3.94e-03, Avg Return: 0.449, Regret: 0.3530, Entropy: 0.1520 +[2026-01-29T22:02:21.949116Z] Loop 1857: Loss: 4.50e-03, Avg Return: 0.456, Regret: 0.3530, Entropy: 0.1475 +[2026-01-29T22:02:23.111940Z] Loop 1858: Loss: 4.76e-03, Avg Return: 0.445, Regret: 0.3530, Entropy: 0.1445 +[2026-01-29T22:02:24.271756Z] Loop 1859: Loss: 5.27e-03, Avg Return: 0.446, Regret: 0.3530, Entropy: 0.1516 +[2026-01-29T22:02:25.477180Z] Loop 1860: Loss: 5.26e-03, Avg Return: 0.448, Regret: 0.3537, Entropy: 0.1551 +[2026-01-29T22:02:26.637960Z] Loop 1861: Loss: 4.76e-03, Avg Return: 0.445, Regret: 0.3537, Entropy: 0.1477 +[2026-01-29T22:02:27.798334Z] Loop 1862: Loss: 5.15e-03, Avg Return: 0.452, Regret: 0.3537, Entropy: 0.1522 +[2026-01-29T22:02:28.957723Z] Loop 1863: Loss: 4.73e-03, Avg Return: 0.449, Regret: 0.3537, Entropy: 0.1459 +[2026-01-29T22:02:30.117718Z] Loop 1864: Loss: 4.71e-03, Avg Return: 0.450, Regret: 0.3537, Entropy: 0.1567 +[2026-01-29T22:02:31.320343Z] Loop 1865: Loss: 5.18e-03, Avg Return: 0.447, Regret: 0.3526, Entropy: 0.1491 +[2026-01-29T22:02:32.486311Z] Loop 1866: Loss: 4.82e-03, Avg Return: 0.457, Regret: 0.3526, Entropy: 0.1482 +[2026-01-29T22:02:33.647052Z] Loop 1867: Loss: 4.13e-03, Avg Return: 0.454, Regret: 0.3526, Entropy: 0.1560 +[2026-01-29T22:02:34.807179Z] Loop 1868: Loss: 3.79e-03, Avg Return: 0.453, Regret: 0.3526, Entropy: 0.1554 +[2026-01-29T22:02:35.966402Z] Loop 1869: Loss: 3.40e-03, Avg Return: 0.454, Regret: 0.3526, Entropy: 0.1544 +[2026-01-29T22:02:37.174063Z] Loop 1870: Loss: 3.19e-03, Avg Return: 0.448, Regret: 0.3526, Entropy: 0.1538 +[2026-01-29T22:02:38.333680Z] Loop 1871: Loss: 2.75e-03, Avg Return: 0.451, Regret: 0.3526, Entropy: 0.1529 +[2026-01-29T22:02:39.493645Z] Loop 1872: Loss: 2.78e-03, Avg Return: 0.453, Regret: 0.3526, Entropy: 0.1420 +[2026-01-29T22:02:40.653130Z] Loop 1873: Loss: 2.56e-03, Avg Return: 0.446, Regret: 0.3526, Entropy: 0.1477 +[2026-01-29T22:02:41.812451Z] Loop 1874: Loss: 2.61e-03, Avg Return: 0.448, Regret: 0.3526, Entropy: 0.1511 +[2026-01-29T22:02:43.016260Z] Loop 1875: Loss: 2.77e-03, Avg Return: 0.446, Regret: 0.3524, Entropy: 0.1459 +[2026-01-29T22:02:44.176252Z] Loop 1876: Loss: 3.07e-03, Avg Return: 0.460, Regret: 0.3524, Entropy: 0.1552 +[2026-01-29T22:02:45.335402Z] Loop 1877: Loss: 3.28e-03, Avg Return: 0.448, Regret: 0.3524, Entropy: 0.1502 +[2026-01-29T22:02:46.495128Z] Loop 1878: Loss: 3.79e-03, Avg Return: 0.452, Regret: 0.3524, Entropy: 0.1535 +[2026-01-29T22:02:47.655862Z] Loop 1879: Loss: 3.59e-03, Avg Return: 0.454, Regret: 0.3524, Entropy: 0.1563 +[2026-01-29T22:02:48.859412Z] Loop 1880: Loss: 4.10e-03, Avg Return: 0.443, Regret: 0.3522, Entropy: 0.1694 +[2026-01-29T22:02:50.019325Z] Loop 1881: Loss: 4.35e-03, Avg Return: 0.449, Regret: 0.3522, Entropy: 0.1659 +[2026-01-29T22:02:51.179735Z] Loop 1882: Loss: 5.14e-03, Avg Return: 0.451, Regret: 0.3522, Entropy: 0.1713 +[2026-01-29T22:02:52.339345Z] Loop 1883: Loss: 4.88e-03, Avg Return: 0.446, Regret: 0.3522, Entropy: 0.1725 +[2026-01-29T22:02:53.498870Z] Loop 1884: Loss: 5.58e-03, Avg Return: 0.457, Regret: 0.3522, Entropy: 0.1729 +[2026-01-29T22:02:54.703308Z] Loop 1885: Loss: 5.22e-03, Avg Return: 0.454, Regret: 0.3535, Entropy: 0.1692 +[2026-01-29T22:02:55.863923Z] Loop 1886: Loss: 5.18e-03, Avg Return: 0.459, Regret: 0.3535, Entropy: 0.1632 +[2026-01-29T22:02:57.023903Z] Loop 1887: Loss: 4.33e-03, Avg Return: 0.453, Regret: 0.3535, Entropy: 0.1745 +[2026-01-29T22:02:58.185139Z] Loop 1888: Loss: 4.76e-03, Avg Return: 0.453, Regret: 0.3535, Entropy: 0.1628 +[2026-01-29T22:02:59.346814Z] Loop 1889: Loss: 4.58e-03, Avg Return: 0.453, Regret: 0.3535, Entropy: 0.1626 +[2026-01-29T22:03:00.551121Z] Loop 1890: Loss: 5.32e-03, Avg Return: 0.448, Regret: 0.3530, Entropy: 0.1683 +[2026-01-29T22:03:01.710705Z] Loop 1891: Loss: 4.90e-03, Avg Return: 0.449, Regret: 0.3530, Entropy: 0.1683 +[2026-01-29T22:03:02.872032Z] Loop 1892: Loss: 4.99e-03, Avg Return: 0.442, Regret: 0.3530, Entropy: 0.1725 +[2026-01-29T22:03:04.034496Z] Loop 1893: Loss: 4.76e-03, Avg Return: 0.451, Regret: 0.3530, Entropy: 0.1635 +[2026-01-29T22:03:05.194738Z] Loop 1894: Loss: 4.64e-03, Avg Return: 0.447, Regret: 0.3530, Entropy: 0.1661 +[2026-01-29T22:03:06.414228Z] Loop 1895: Loss: 4.36e-03, Avg Return: 0.449, Regret: 0.3525, Entropy: 0.1637 +[2026-01-29T22:03:07.576343Z] Loop 1896: Loss: 4.76e-03, Avg Return: 0.456, Regret: 0.3525, Entropy: 0.1594 +[2026-01-29T22:03:08.737058Z] Loop 1897: Loss: 4.80e-03, Avg Return: 0.453, Regret: 0.3525, Entropy: 0.1552 +[2026-01-29T22:03:09.896138Z] Loop 1898: Loss: 4.23e-03, Avg Return: 0.454, Regret: 0.3525, Entropy: 0.1578 +[2026-01-29T22:03:11.056631Z] Loop 1899: Loss: 3.79e-03, Avg Return: 0.447, Regret: 0.3525, Entropy: 0.1545 +[2026-01-29T22:03:12.261520Z] Loop 1900: Loss: 3.70e-03, Avg Return: 0.450, Regret: 0.3520, Entropy: 0.1557 +[2026-01-29T22:03:13.423230Z] Loop 1901: Loss: 3.57e-03, Avg Return: 0.454, Regret: 0.3520, Entropy: 0.1521 +[2026-01-29T22:03:14.583561Z] Loop 1902: Loss: 3.22e-03, Avg Return: 0.452, Regret: 0.3520, Entropy: 0.1518 +[2026-01-29T22:03:15.743716Z] Loop 1903: Loss: 2.96e-03, Avg Return: 0.455, Regret: 0.3520, Entropy: 0.1468 +[2026-01-29T22:03:16.904270Z] Loop 1904: Loss: 2.82e-03, Avg Return: 0.458, Regret: 0.3520, Entropy: 0.1411 +[2026-01-29T22:03:18.109362Z] Loop 1905: Loss: 2.52e-03, Avg Return: 0.456, Regret: 0.3526, Entropy: 0.1353 +[2026-01-29T22:03:19.269239Z] Loop 1906: Loss: 2.04e-03, Avg Return: 0.451, Regret: 0.3526, Entropy: 0.1273 +[2026-01-29T22:03:20.428787Z] Loop 1907: Loss: 1.96e-03, Avg Return: 0.447, Regret: 0.3526, Entropy: 0.1262 +[2026-01-29T22:03:21.587766Z] Loop 1908: Loss: 2.04e-03, Avg Return: 0.456, Regret: 0.3526, Entropy: 0.1253 +[2026-01-29T22:03:22.747463Z] Loop 1909: Loss: 2.12e-03, Avg Return: 0.451, Regret: 0.3526, Entropy: 0.1331 +[2026-01-29T22:03:23.953130Z] Loop 1910: Loss: 1.97e-03, Avg Return: 0.441, Regret: 0.3531, Entropy: 0.1336 +[2026-01-29T22:03:25.113859Z] Loop 1911: Loss: 2.11e-03, Avg Return: 0.452, Regret: 0.3531, Entropy: 0.1335 +[2026-01-29T22:03:26.273678Z] Loop 1912: Loss: 2.31e-03, Avg Return: 0.448, Regret: 0.3531, Entropy: 0.1307 +[2026-01-29T22:03:27.434294Z] Loop 1913: Loss: 2.42e-03, Avg Return: 0.449, Regret: 0.3531, Entropy: 0.1319 +[2026-01-29T22:03:28.595958Z] Loop 1914: Loss: 2.31e-03, Avg Return: 0.451, Regret: 0.3531, Entropy: 0.1351 +[2026-01-29T22:03:29.800596Z] Loop 1915: Loss: 2.42e-03, Avg Return: 0.452, Regret: 0.3523, Entropy: 0.1387 +[2026-01-29T22:03:30.966976Z] Loop 1916: Loss: 2.55e-03, Avg Return: 0.455, Regret: 0.3523, Entropy: 0.1425 +[2026-01-29T22:03:32.126945Z] Loop 1917: Loss: 3.02e-03, Avg Return: 0.449, Regret: 0.3523, Entropy: 0.1470 +[2026-01-29T22:03:33.288371Z] Loop 1918: Loss: 3.78e-03, Avg Return: 0.446, Regret: 0.3523, Entropy: 0.1650 +[2026-01-29T22:03:34.448114Z] Loop 1919: Loss: 4.37e-03, Avg Return: 0.453, Regret: 0.3523, Entropy: 0.1778 +[2026-01-29T22:03:35.653509Z] Loop 1920: Loss: 5.07e-03, Avg Return: 0.450, Regret: 0.3556, Entropy: 0.1749 +[2026-01-29T22:03:36.814717Z] Loop 1921: Loss: 5.37e-03, Avg Return: 0.443, Regret: 0.3556, Entropy: 0.1830 +[2026-01-29T22:03:37.975638Z] Loop 1922: Loss: 5.08e-03, Avg Return: 0.437, Regret: 0.3556, Entropy: 0.1720 +[2026-01-29T22:03:39.135172Z] Loop 1923: Loss: 5.00e-03, Avg Return: 0.439, Regret: 0.3556, Entropy: 0.1657 +[2026-01-29T22:03:40.295223Z] Loop 1924: Loss: 5.31e-03, Avg Return: 0.441, Regret: 0.3556, Entropy: 0.1724 +[2026-01-29T22:03:41.500314Z] Loop 1925: Loss: 5.18e-03, Avg Return: 0.456, Regret: 0.3552, Entropy: 0.1578 +[2026-01-29T22:03:42.661213Z] Loop 1926: Loss: 5.42e-03, Avg Return: 0.448, Regret: 0.3552, Entropy: 0.1615 +[2026-01-29T22:03:43.820959Z] Loop 1927: Loss: 4.32e-03, Avg Return: 0.456, Regret: 0.3552, Entropy: 0.1488 +[2026-01-29T22:03:44.982044Z] Loop 1928: Loss: 4.36e-03, Avg Return: 0.449, Regret: 0.3552, Entropy: 0.1479 +[2026-01-29T22:03:46.141834Z] Loop 1929: Loss: 4.40e-03, Avg Return: 0.456, Regret: 0.3552, Entropy: 0.1412 +[2026-01-29T22:03:47.353276Z] Loop 1930: Loss: 3.70e-03, Avg Return: 0.451, Regret: 0.3521, Entropy: 0.1374 +[2026-01-29T22:03:48.512860Z] Loop 1931: Loss: 4.22e-03, Avg Return: 0.449, Regret: 0.3521, Entropy: 0.1325 +[2026-01-29T22:03:49.672808Z] Loop 1932: Loss: 4.01e-03, Avg Return: 0.457, Regret: 0.3521, Entropy: 0.1348 +[2026-01-29T22:03:50.832188Z] Loop 1933: Loss: 4.63e-03, Avg Return: 0.456, Regret: 0.3521, Entropy: 0.1393 +[2026-01-29T22:03:51.992185Z] Loop 1934: Loss: 4.18e-03, Avg Return: 0.456, Regret: 0.3521, Entropy: 0.1318 +[2026-01-29T22:03:53.197300Z] Loop 1935: Loss: 4.00e-03, Avg Return: 0.446, Regret: 0.3526, Entropy: 0.1304 +[2026-01-29T22:03:54.357743Z] Loop 1936: Loss: 4.35e-03, Avg Return: 0.448, Regret: 0.3526, Entropy: 0.1303 +[2026-01-29T22:03:55.517027Z] Loop 1937: Loss: 4.25e-03, Avg Return: 0.451, Regret: 0.3526, Entropy: 0.1301 +[2026-01-29T22:03:56.677366Z] Loop 1938: Loss: 4.74e-03, Avg Return: 0.451, Regret: 0.3526, Entropy: 0.1328 +[2026-01-29T22:03:57.836303Z] Loop 1939: Loss: 4.36e-03, Avg Return: 0.456, Regret: 0.3526, Entropy: 0.1294 +[2026-01-29T22:03:59.039938Z] Loop 1940: Loss: 4.14e-03, Avg Return: 0.445, Regret: 0.3525, Entropy: 0.1350 +[2026-01-29T22:04:00.200331Z] Loop 1941: Loss: 4.02e-03, Avg Return: 0.461, Regret: 0.3525, Entropy: 0.1387 +[2026-01-29T22:04:01.361998Z] Loop 1942: Loss: 3.92e-03, Avg Return: 0.454, Regret: 0.3525, Entropy: 0.1350 +[2026-01-29T22:04:02.521566Z] Loop 1943: Loss: 3.27e-03, Avg Return: 0.448, Regret: 0.3525, Entropy: 0.1449 +[2026-01-29T22:04:03.681850Z] Loop 1944: Loss: 3.53e-03, Avg Return: 0.458, Regret: 0.3525, Entropy: 0.1498 +[2026-01-29T22:04:04.886441Z] Loop 1945: Loss: 3.24e-03, Avg Return: 0.449, Regret: 0.3534, Entropy: 0.1450 +[2026-01-29T22:04:06.047755Z] Loop 1946: Loss: 2.57e-03, Avg Return: 0.447, Regret: 0.3534, Entropy: 0.1412 +[2026-01-29T22:04:07.207193Z] Loop 1947: Loss: 2.50e-03, Avg Return: 0.450, Regret: 0.3534, Entropy: 0.1326 +[2026-01-29T22:04:08.368113Z] Loop 1948: Loss: 2.27e-03, Avg Return: 0.452, Regret: 0.3534, Entropy: 0.1338 +[2026-01-29T22:04:09.529121Z] Loop 1949: Loss: 2.00e-03, Avg Return: 0.451, Regret: 0.3534, Entropy: 0.1371 +[2026-01-29T22:04:10.734586Z] Loop 1950: Loss: 2.24e-03, Avg Return: 0.451, Regret: 0.3541, Entropy: 0.1327 +[2026-01-29T22:04:11.895819Z] Loop 1951: Loss: 2.08e-03, Avg Return: 0.457, Regret: 0.3541, Entropy: 0.1271 +[2026-01-29T22:04:13.058950Z] Loop 1952: Loss: 2.11e-03, Avg Return: 0.455, Regret: 0.3541, Entropy: 0.1283 +[2026-01-29T22:04:14.219566Z] Loop 1953: Loss: 2.10e-03, Avg Return: 0.457, Regret: 0.3541, Entropy: 0.1296 +[2026-01-29T22:04:15.379868Z] Loop 1954: Loss: 1.93e-03, Avg Return: 0.454, Regret: 0.3541, Entropy: 0.1263 +[2026-01-29T22:04:16.585109Z] Loop 1955: Loss: 2.04e-03, Avg Return: 0.443, Regret: 0.3537, Entropy: 0.1279 +[2026-01-29T22:04:17.747471Z] Loop 1956: Loss: 1.70e-03, Avg Return: 0.449, Regret: 0.3537, Entropy: 0.1325 +[2026-01-29T22:04:18.909770Z] Loop 1957: Loss: 1.76e-03, Avg Return: 0.444, Regret: 0.3537, Entropy: 0.1314 +[2026-01-29T22:04:20.068625Z] Loop 1958: Loss: 1.58e-03, Avg Return: 0.445, Regret: 0.3537, Entropy: 0.1257 +[2026-01-29T22:04:21.229122Z] Loop 1959: Loss: 1.86e-03, Avg Return: 0.447, Regret: 0.3537, Entropy: 0.1211 +[2026-01-29T22:04:22.434069Z] Loop 1960: Loss: 1.85e-03, Avg Return: 0.450, Regret: 0.3540, Entropy: 0.1277 +[2026-01-29T22:04:23.595251Z] Loop 1961: Loss: 1.75e-03, Avg Return: 0.451, Regret: 0.3540, Entropy: 0.1241 +[2026-01-29T22:04:24.755331Z] Loop 1962: Loss: 1.78e-03, Avg Return: 0.454, Regret: 0.3540, Entropy: 0.1270 +[2026-01-29T22:04:25.916298Z] Loop 1963: Loss: 1.97e-03, Avg Return: 0.452, Regret: 0.3540, Entropy: 0.1218 +[2026-01-29T22:04:27.076054Z] Loop 1964: Loss: 1.70e-03, Avg Return: 0.441, Regret: 0.3540, Entropy: 0.1194 +[2026-01-29T22:04:28.280618Z] Loop 1965: Loss: 2.04e-03, Avg Return: 0.448, Regret: 0.3527, Entropy: 0.1272 +[2026-01-29T22:04:29.440985Z] Loop 1966: Loss: 2.02e-03, Avg Return: 0.454, Regret: 0.3527, Entropy: 0.1295 +[2026-01-29T22:04:30.603118Z] Loop 1967: Loss: 2.13e-03, Avg Return: 0.459, Regret: 0.3527, Entropy: 0.1258 +[2026-01-29T22:04:31.763746Z] Loop 1968: Loss: 2.14e-03, Avg Return: 0.453, Regret: 0.3527, Entropy: 0.1307 +[2026-01-29T22:04:32.925310Z] Loop 1969: Loss: 2.16e-03, Avg Return: 0.459, Regret: 0.3527, Entropy: 0.1375 +[2026-01-29T22:04:34.134083Z] Loop 1970: Loss: 2.29e-03, Avg Return: 0.443, Regret: 0.3518, Entropy: 0.1363 +[2026-01-29T22:04:35.295848Z] Loop 1971: Loss: 2.57e-03, Avg Return: 0.448, Regret: 0.3518, Entropy: 0.1416 +[2026-01-29T22:04:36.456940Z] Loop 1972: Loss: 3.31e-03, Avg Return: 0.453, Regret: 0.3518, Entropy: 0.1564 +[2026-01-29T22:04:37.617820Z] Loop 1973: Loss: 3.80e-03, Avg Return: 0.449, Regret: 0.3518, Entropy: 0.1584 +[2026-01-29T22:04:38.779202Z] Loop 1974: Loss: 4.12e-03, Avg Return: 0.448, Regret: 0.3518, Entropy: 0.1619 +[2026-01-29T22:04:39.985779Z] Loop 1975: Loss: 4.35e-03, Avg Return: 0.454, Regret: 0.3531, Entropy: 0.1776 +[2026-01-29T22:04:41.147743Z] Loop 1976: Loss: 4.00e-03, Avg Return: 0.451, Regret: 0.3531, Entropy: 0.1719 +[2026-01-29T22:04:42.308864Z] Loop 1977: Loss: 4.11e-03, Avg Return: 0.446, Regret: 0.3531, Entropy: 0.1748 +[2026-01-29T22:04:43.469621Z] Loop 1978: Loss: 4.01e-03, Avg Return: 0.454, Regret: 0.3531, Entropy: 0.1687 +[2026-01-29T22:04:44.631968Z] Loop 1979: Loss: 3.94e-03, Avg Return: 0.450, Regret: 0.3531, Entropy: 0.1602 +[2026-01-29T22:04:45.840286Z] Loop 1980: Loss: 3.66e-03, Avg Return: 0.450, Regret: 0.3521, Entropy: 0.1604 +[2026-01-29T22:04:47.001631Z] Loop 1981: Loss: 3.75e-03, Avg Return: 0.453, Regret: 0.3521, Entropy: 0.1561 +[2026-01-29T22:04:48.162182Z] Loop 1982: Loss: 3.96e-03, Avg Return: 0.459, Regret: 0.3521, Entropy: 0.1523 +[2026-01-29T22:04:49.323539Z] Loop 1983: Loss: 3.58e-03, Avg Return: 0.458, Regret: 0.3521, Entropy: 0.1504 +[2026-01-29T22:04:50.485530Z] Loop 1984: Loss: 3.37e-03, Avg Return: 0.458, Regret: 0.3521, Entropy: 0.1513 +[2026-01-29T22:04:51.694035Z] Loop 1985: Loss: 3.26e-03, Avg Return: 0.455, Regret: 0.3517, Entropy: 0.1494 +[2026-01-29T22:04:52.854478Z] Loop 1986: Loss: 2.72e-03, Avg Return: 0.446, Regret: 0.3517, Entropy: 0.1425 +[2026-01-29T22:04:54.015374Z] Loop 1987: Loss: 2.49e-03, Avg Return: 0.448, Regret: 0.3517, Entropy: 0.1374 +[2026-01-29T22:04:55.176037Z] Loop 1988: Loss: 2.72e-03, Avg Return: 0.451, Regret: 0.3517, Entropy: 0.1368 +[2026-01-29T22:04:56.335715Z] Loop 1989: Loss: 2.86e-03, Avg Return: 0.457, Regret: 0.3517, Entropy: 0.1358 +[2026-01-29T22:04:57.541082Z] Loop 1990: Loss: 2.52e-03, Avg Return: 0.456, Regret: 0.3516, Entropy: 0.1384 +[2026-01-29T22:04:58.701935Z] Loop 1991: Loss: 2.54e-03, Avg Return: 0.452, Regret: 0.3516, Entropy: 0.1314 +[2026-01-29T22:04:59.862001Z] Loop 1992: Loss: 2.09e-03, Avg Return: 0.454, Regret: 0.3516, Entropy: 0.1308 +[2026-01-29T22:05:01.021635Z] Loop 1993: Loss: 1.81e-03, Avg Return: 0.450, Regret: 0.3516, Entropy: 0.1317 +[2026-01-29T22:05:02.182554Z] Loop 1994: Loss: 2.00e-03, Avg Return: 0.454, Regret: 0.3516, Entropy: 0.1213 +[2026-01-29T22:05:03.389223Z] Loop 1995: Loss: 1.88e-03, Avg Return: 0.443, Regret: 0.3520, Entropy: 0.1265 +[2026-01-29T22:05:04.550371Z] Loop 1996: Loss: 2.05e-03, Avg Return: 0.453, Regret: 0.3520, Entropy: 0.1231 +[2026-01-29T22:05:05.710300Z] Loop 1997: Loss: 1.88e-03, Avg Return: 0.459, Regret: 0.3520, Entropy: 0.1172 +[2026-01-29T22:05:06.871058Z] Loop 1998: Loss: 1.97e-03, Avg Return: 0.451, Regret: 0.3520, Entropy: 0.1209 +[2026-01-29T22:05:08.031999Z] Loop 1999: Loss: 2.20e-03, Avg Return: 0.457, Regret: 0.3520, Entropy: 0.1246 +[2026-01-29T22:05:09.236210Z] Loop 2000: Loss: 2.53e-03, Avg Return: 0.450, Regret: 0.3529, Entropy: 0.1314 +[2026-01-29T22:05:10.396233Z] Loop 2001: Loss: 2.48e-03, Avg Return: 0.448, Regret: 0.3529, Entropy: 0.1270 +[2026-01-29T22:05:11.556427Z] Loop 2002: Loss: 2.56e-03, Avg Return: 0.447, Regret: 0.3529, Entropy: 0.1343 +[2026-01-29T22:05:12.717105Z] Loop 2003: Loss: 2.59e-03, Avg Return: 0.451, Regret: 0.3529, Entropy: 0.1318 +[2026-01-29T22:05:13.876615Z] Loop 2004: Loss: 2.40e-03, Avg Return: 0.453, Regret: 0.3529, Entropy: 0.1222 +[2026-01-29T22:05:15.037455Z] Loop 2005: Loss: 2.18e-03, Avg Return: 0.453, Regret: 0.3529, Entropy: 0.1254 +[2026-01-29T22:05:16.197248Z] Loop 2006: Loss: 1.96e-03, Avg Return: 0.459, Regret: 0.3529, Entropy: 0.1224 +[2026-01-29T22:05:17.357333Z] Loop 2007: Loss: 2.08e-03, Avg Return: 0.451, Regret: 0.3529, Entropy: 0.1179 +[2026-01-29T22:05:18.516783Z] Loop 2008: Loss: 2.04e-03, Avg Return: 0.445, Regret: 0.3529, Entropy: 0.1181 +[2026-01-29T22:05:19.676941Z] Loop 2009: Loss: 1.80e-03, Avg Return: 0.456, Regret: 0.3529, Entropy: 0.1192 +[2026-01-29T22:05:20.884975Z] Loop 2010: Loss: 2.00e-03, Avg Return: 0.447, Regret: 0.3515, Entropy: 0.1260 +[2026-01-29T22:05:22.047709Z] Loop 2011: Loss: 2.74e-03, Avg Return: 0.450, Regret: 0.3515, Entropy: 0.1412 +[2026-01-29T22:05:23.208891Z] Loop 2012: Loss: 2.85e-03, Avg Return: 0.459, Regret: 0.3515, Entropy: 0.1363 +[2026-01-29T22:05:24.368794Z] Loop 2013: Loss: 2.95e-03, Avg Return: 0.446, Regret: 0.3515, Entropy: 0.1379 +[2026-01-29T22:05:25.529401Z] Loop 2014: Loss: 3.46e-03, Avg Return: 0.458, Regret: 0.3515, Entropy: 0.1422 +[2026-01-29T22:05:26.694035Z] Loop 2015: Loss: 3.60e-03, Avg Return: 0.454, Regret: 0.3515, Entropy: 0.1434 +[2026-01-29T22:05:27.857582Z] Loop 2016: Loss: 3.05e-03, Avg Return: 0.445, Regret: 0.3515, Entropy: 0.1494 +[2026-01-29T22:05:29.018172Z] Loop 2017: Loss: 2.89e-03, Avg Return: 0.453, Regret: 0.3515, Entropy: 0.1363 +[2026-01-29T22:05:30.178300Z] Loop 2018: Loss: 2.71e-03, Avg Return: 0.453, Regret: 0.3515, Entropy: 0.1344 +[2026-01-29T22:05:31.339536Z] Loop 2019: Loss: 2.33e-03, Avg Return: 0.446, Regret: 0.3515, Entropy: 0.1341 +[2026-01-29T22:05:32.548239Z] Loop 2020: Loss: 2.09e-03, Avg Return: 0.448, Regret: 0.3515, Entropy: 0.1217 +[2026-01-29T22:05:33.709129Z] Loop 2021: Loss: 2.04e-03, Avg Return: 0.447, Regret: 0.3515, Entropy: 0.1199 +[2026-01-29T22:05:34.868726Z] Loop 2022: Loss: 2.04e-03, Avg Return: 0.450, Regret: 0.3515, Entropy: 0.1189 +[2026-01-29T22:05:36.030117Z] Loop 2023: Loss: 1.74e-03, Avg Return: 0.461, Regret: 0.3515, Entropy: 0.1188 +[2026-01-29T22:05:37.193189Z] Loop 2024: Loss: 1.75e-03, Avg Return: 0.458, Regret: 0.3515, Entropy: 0.1147 +[2026-01-29T22:05:38.353462Z] Loop 2025: Loss: 1.61e-03, Avg Return: 0.449, Regret: 0.3515, Entropy: 0.1234 +[2026-01-29T22:05:39.512828Z] Loop 2026: Loss: 1.71e-03, Avg Return: 0.450, Regret: 0.3515, Entropy: 0.1182 +[2026-01-29T22:05:40.672747Z] Loop 2027: Loss: 1.85e-03, Avg Return: 0.450, Regret: 0.3515, Entropy: 0.1179 +[2026-01-29T22:05:41.834961Z] Loop 2028: Loss: 1.80e-03, Avg Return: 0.445, Regret: 0.3515, Entropy: 0.1240 +[2026-01-29T22:05:42.996073Z] Loop 2029: Loss: 2.30e-03, Avg Return: 0.453, Regret: 0.3515, Entropy: 0.1191 +[2026-01-29T22:05:44.203275Z] Loop 2030: Loss: 2.28e-03, Avg Return: 0.450, Regret: 0.3515, Entropy: 0.1256 +[2026-01-29T22:05:45.363285Z] Loop 2031: Loss: 2.19e-03, Avg Return: 0.456, Regret: 0.3515, Entropy: 0.1306 +[2026-01-29T22:05:46.524999Z] Loop 2032: Loss: 2.67e-03, Avg Return: 0.449, Regret: 0.3515, Entropy: 0.1330 +[2026-01-29T22:05:47.685037Z] Loop 2033: Loss: 3.14e-03, Avg Return: 0.452, Regret: 0.3515, Entropy: 0.1344 +[2026-01-29T22:05:48.846629Z] Loop 2034: Loss: 3.06e-03, Avg Return: 0.454, Regret: 0.3515, Entropy: 0.1368 +[2026-01-29T22:05:50.006783Z] Loop 2035: Loss: 3.39e-03, Avg Return: 0.443, Regret: 0.3515, Entropy: 0.1416 +[2026-01-29T22:05:51.167315Z] Loop 2036: Loss: 3.47e-03, Avg Return: 0.448, Regret: 0.3515, Entropy: 0.1372 +[2026-01-29T22:05:52.328630Z] Loop 2037: Loss: 4.34e-03, Avg Return: 0.458, Regret: 0.3515, Entropy: 0.1395 +[2026-01-29T22:05:53.488467Z] Loop 2038: Loss: 4.16e-03, Avg Return: 0.449, Regret: 0.3515, Entropy: 0.1395 +[2026-01-29T22:05:54.649454Z] Loop 2039: Loss: 4.16e-03, Avg Return: 0.451, Regret: 0.3515, Entropy: 0.1400 +[2026-01-29T22:05:55.854996Z] Loop 2040: Loss: 4.34e-03, Avg Return: 0.445, Regret: 0.3533, Entropy: 0.1310 +[2026-01-29T22:05:57.016364Z] Loop 2041: Loss: 4.65e-03, Avg Return: 0.453, Regret: 0.3533, Entropy: 0.1336 +[2026-01-29T22:05:58.177091Z] Loop 2042: Loss: 4.56e-03, Avg Return: 0.454, Regret: 0.3533, Entropy: 0.1283 +[2026-01-29T22:05:59.338015Z] Loop 2043: Loss: 4.44e-03, Avg Return: 0.453, Regret: 0.3533, Entropy: 0.1267 +[2026-01-29T22:06:00.501272Z] Loop 2044: Loss: 4.94e-03, Avg Return: 0.455, Regret: 0.3533, Entropy: 0.1270 +[2026-01-29T22:06:01.663255Z] Loop 2045: Loss: 3.80e-03, Avg Return: 0.445, Regret: 0.3533, Entropy: 0.1226 +[2026-01-29T22:06:02.828420Z] Loop 2046: Loss: 3.75e-03, Avg Return: 0.455, Regret: 0.3533, Entropy: 0.1179 +[2026-01-29T22:06:03.994792Z] Loop 2047: Loss: 3.48e-03, Avg Return: 0.446, Regret: 0.3533, Entropy: 0.1192 +[2026-01-29T22:06:05.156211Z] Loop 2048: Loss: 3.01e-03, Avg Return: 0.462, Regret: 0.3533, Entropy: 0.1233 +[2026-01-29T22:06:06.318512Z] Loop 2049: Loss: 2.79e-03, Avg Return: 0.452, Regret: 0.3533, Entropy: 0.1243 +[2026-01-29T22:06:07.528804Z] Loop 2050: Loss: 2.69e-03, Avg Return: 0.449, Regret: 0.3520, Entropy: 0.1319 +[2026-01-29T22:06:08.690856Z] Loop 2051: Loss: 2.69e-03, Avg Return: 0.450, Regret: 0.3520, Entropy: 0.1270 +[2026-01-29T22:06:09.852342Z] Loop 2052: Loss: 2.36e-03, Avg Return: 0.455, Regret: 0.3520, Entropy: 0.1184 +[2026-01-29T22:06:11.016412Z] Loop 2053: Loss: 1.62e-03, Avg Return: 0.452, Regret: 0.3520, Entropy: 0.1136 +[2026-01-29T22:06:12.182850Z] Loop 2054: Loss: 1.73e-03, Avg Return: 0.454, Regret: 0.3520, Entropy: 0.1081 +[2026-01-29T22:06:13.344948Z] Loop 2055: Loss: 1.53e-03, Avg Return: 0.449, Regret: 0.3520, Entropy: 0.1077 +[2026-01-29T22:06:14.505239Z] Loop 2056: Loss: 1.56e-03, Avg Return: 0.443, Regret: 0.3520, Entropy: 0.1072 +[2026-01-29T22:06:15.666212Z] Loop 2057: Loss: 1.46e-03, Avg Return: 0.451, Regret: 0.3520, Entropy: 0.1091 +[2026-01-29T22:06:16.828336Z] Loop 2058: Loss: 1.58e-03, Avg Return: 0.446, Regret: 0.3520, Entropy: 0.1083 +[2026-01-29T22:06:17.989460Z] Loop 2059: Loss: 1.61e-03, Avg Return: 0.447, Regret: 0.3520, Entropy: 0.1072 +[2026-01-29T22:06:19.206795Z] Loop 2060: Loss: 1.61e-03, Avg Return: 0.451, Regret: 0.3537, Entropy: 0.1053 +[2026-01-29T22:06:20.370033Z] Loop 2061: Loss: 1.77e-03, Avg Return: 0.452, Regret: 0.3537, Entropy: 0.1043 +[2026-01-29T22:06:21.532583Z] Loop 2062: Loss: 1.92e-03, Avg Return: 0.450, Regret: 0.3537, Entropy: 0.1065 +[2026-01-29T22:06:22.694612Z] Loop 2063: Loss: 1.90e-03, Avg Return: 0.448, Regret: 0.3537, Entropy: 0.1147 +[2026-01-29T22:06:23.854727Z] Loop 2064: Loss: 1.90e-03, Avg Return: 0.447, Regret: 0.3537, Entropy: 0.1099 +[2026-01-29T22:06:25.016803Z] Loop 2065: Loss: 2.07e-03, Avg Return: 0.452, Regret: 0.3537, Entropy: 0.1087 +[2026-01-29T22:06:26.181411Z] Loop 2066: Loss: 2.01e-03, Avg Return: 0.448, Regret: 0.3537, Entropy: 0.1172 +[2026-01-29T22:06:27.344852Z] Loop 2067: Loss: 1.92e-03, Avg Return: 0.450, Regret: 0.3537, Entropy: 0.1123 +[2026-01-29T22:06:28.509479Z] Loop 2068: Loss: 1.78e-03, Avg Return: 0.451, Regret: 0.3537, Entropy: 0.1154 +[2026-01-29T22:06:29.670868Z] Loop 2069: Loss: 2.05e-03, Avg Return: 0.454, Regret: 0.3537, Entropy: 0.1103 +[2026-01-29T22:06:30.880492Z] Loop 2070: Loss: 2.00e-03, Avg Return: 0.455, Regret: 0.3520, Entropy: 0.1092 +[2026-01-29T22:06:32.042223Z] Loop 2071: Loss: 2.01e-03, Avg Return: 0.451, Regret: 0.3520, Entropy: 0.1090 +[2026-01-29T22:06:33.204347Z] Loop 2072: Loss: 2.08e-03, Avg Return: 0.453, Regret: 0.3520, Entropy: 0.1175 +[2026-01-29T22:06:34.365330Z] Loop 2073: Loss: 2.02e-03, Avg Return: 0.457, Regret: 0.3520, Entropy: 0.1139 +[2026-01-29T22:06:35.526366Z] Loop 2074: Loss: 2.01e-03, Avg Return: 0.457, Regret: 0.3520, Entropy: 0.1190 +[2026-01-29T22:06:36.686896Z] Loop 2075: Loss: 2.37e-03, Avg Return: 0.457, Regret: 0.3520, Entropy: 0.1179 +[2026-01-29T22:06:37.848363Z] Loop 2076: Loss: 2.35e-03, Avg Return: 0.451, Regret: 0.3520, Entropy: 0.1231 +[2026-01-29T22:06:39.011272Z] Loop 2077: Loss: 2.82e-03, Avg Return: 0.452, Regret: 0.3520, Entropy: 0.1304 +[2026-01-29T22:06:40.172017Z] Loop 2078: Loss: 3.11e-03, Avg Return: 0.454, Regret: 0.3520, Entropy: 0.1367 +[2026-01-29T22:06:41.333349Z] Loop 2079: Loss: 3.35e-03, Avg Return: 0.452, Regret: 0.3520, Entropy: 0.1359 +[2026-01-29T22:06:42.538419Z] Loop 2080: Loss: 3.59e-03, Avg Return: 0.443, Regret: 0.3528, Entropy: 0.1406 +[2026-01-29T22:06:43.701932Z] Loop 2081: Loss: 4.05e-03, Avg Return: 0.447, Regret: 0.3528, Entropy: 0.1388 +[2026-01-29T22:06:44.864469Z] Loop 2082: Loss: 3.59e-03, Avg Return: 0.449, Regret: 0.3528, Entropy: 0.1355 +[2026-01-29T22:06:46.029741Z] Loop 2083: Loss: 3.96e-03, Avg Return: 0.446, Regret: 0.3528, Entropy: 0.1397 +[2026-01-29T22:06:47.199429Z] Loop 2084: Loss: 3.76e-03, Avg Return: 0.447, Regret: 0.3528, Entropy: 0.1337 +[2026-01-29T22:06:48.361213Z] Loop 2085: Loss: 4.02e-03, Avg Return: 0.446, Regret: 0.3528, Entropy: 0.1300 +[2026-01-29T22:06:49.524806Z] Loop 2086: Loss: 3.68e-03, Avg Return: 0.452, Regret: 0.3528, Entropy: 0.1337 +[2026-01-29T22:06:50.686262Z] Loop 2087: Loss: 3.17e-03, Avg Return: 0.456, Regret: 0.3528, Entropy: 0.1349 +[2026-01-29T22:06:51.846753Z] Loop 2088: Loss: 3.12e-03, Avg Return: 0.447, Regret: 0.3528, Entropy: 0.1272 +[2026-01-29T22:06:53.006827Z] Loop 2089: Loss: 3.15e-03, Avg Return: 0.451, Regret: 0.3528, Entropy: 0.1294 +[2026-01-29T22:06:54.213379Z] Loop 2090: Loss: 2.70e-03, Avg Return: 0.448, Regret: 0.3514, Entropy: 0.1262 +[2026-01-29T22:06:55.375418Z] Loop 2091: Loss: 2.53e-03, Avg Return: 0.447, Regret: 0.3514, Entropy: 0.1250 +[2026-01-29T22:06:56.537198Z] Loop 2092: Loss: 2.45e-03, Avg Return: 0.453, Regret: 0.3514, Entropy: 0.1177 +[2026-01-29T22:06:57.700046Z] Loop 2093: Loss: 2.16e-03, Avg Return: 0.452, Regret: 0.3514, Entropy: 0.1161 +[2026-01-29T22:06:58.860635Z] Loop 2094: Loss: 1.85e-03, Avg Return: 0.447, Regret: 0.3514, Entropy: 0.1136 +[2026-01-29T22:07:00.021935Z] Loop 2095: Loss: 1.94e-03, Avg Return: 0.454, Regret: 0.3514, Entropy: 0.1117 +[2026-01-29T22:07:01.185692Z] Loop 2096: Loss: 1.91e-03, Avg Return: 0.451, Regret: 0.3514, Entropy: 0.1052 +[2026-01-29T22:07:02.345001Z] Loop 2097: Loss: 1.45e-03, Avg Return: 0.446, Regret: 0.3514, Entropy: 0.1032 +[2026-01-29T22:07:03.510609Z] Loop 2098: Loss: 1.80e-03, Avg Return: 0.458, Regret: 0.3514, Entropy: 0.1036 +[2026-01-29T22:07:04.671494Z] Loop 2099: Loss: 1.68e-03, Avg Return: 0.446, Regret: 0.3514, Entropy: 0.1124 +[2026-01-29T22:07:05.882390Z] Loop 2100: Loss: 2.20e-03, Avg Return: 0.449, Regret: 0.3544, Entropy: 0.1099 +[2026-01-29T22:07:07.043794Z] Loop 2101: Loss: 2.52e-03, Avg Return: 0.450, Regret: 0.3544, Entropy: 0.1165 +[2026-01-29T22:07:08.204808Z] Loop 2102: Loss: 2.89e-03, Avg Return: 0.447, Regret: 0.3544, Entropy: 0.1253 +[2026-01-29T22:07:09.367112Z] Loop 2103: Loss: 3.23e-03, Avg Return: 0.442, Regret: 0.3544, Entropy: 0.1349 +[2026-01-29T22:07:10.528677Z] Loop 2104: Loss: 3.19e-03, Avg Return: 0.447, Regret: 0.3544, Entropy: 0.1306 +[2026-01-29T22:07:11.690720Z] Loop 2105: Loss: 3.36e-03, Avg Return: 0.446, Regret: 0.3544, Entropy: 0.1320 +[2026-01-29T22:07:12.850961Z] Loop 2106: Loss: 2.74e-03, Avg Return: 0.445, Regret: 0.3544, Entropy: 0.1320 +[2026-01-29T22:07:14.011820Z] Loop 2107: Loss: 2.80e-03, Avg Return: 0.450, Regret: 0.3544, Entropy: 0.1217 +[2026-01-29T22:07:15.171899Z] Loop 2108: Loss: 2.57e-03, Avg Return: 0.452, Regret: 0.3544, Entropy: 0.1155 +[2026-01-29T22:07:16.332860Z] Loop 2109: Loss: 1.79e-03, Avg Return: 0.455, Regret: 0.3544, Entropy: 0.1091 +[2026-01-29T22:07:17.545633Z] Loop 2110: Loss: 1.79e-03, Avg Return: 0.446, Regret: 0.3527, Entropy: 0.1111 +[2026-01-29T22:07:18.708488Z] Loop 2111: Loss: 1.83e-03, Avg Return: 0.445, Regret: 0.3527, Entropy: 0.1096 +[2026-01-29T22:07:19.870629Z] Loop 2112: Loss: 2.31e-03, Avg Return: 0.450, Regret: 0.3527, Entropy: 0.1162 +[2026-01-29T22:07:21.031942Z] Loop 2113: Loss: 2.82e-03, Avg Return: 0.455, Regret: 0.3527, Entropy: 0.1238 +[2026-01-29T22:07:22.192943Z] Loop 2114: Loss: 2.35e-03, Avg Return: 0.453, Regret: 0.3527, Entropy: 0.1226 +[2026-01-29T22:07:23.357396Z] Loop 2115: Loss: 2.69e-03, Avg Return: 0.450, Regret: 0.3527, Entropy: 0.1186 +[2026-01-29T22:07:24.517789Z] Loop 2116: Loss: 2.96e-03, Avg Return: 0.448, Regret: 0.3527, Entropy: 0.1165 +[2026-01-29T22:07:25.679290Z] Loop 2117: Loss: 3.55e-03, Avg Return: 0.448, Regret: 0.3527, Entropy: 0.1129 +[2026-01-29T22:07:26.839199Z] Loop 2118: Loss: 4.38e-03, Avg Return: 0.450, Regret: 0.3527, Entropy: 0.1216 +[2026-01-29T22:07:27.999897Z] Loop 2119: Loss: 4.16e-03, Avg Return: 0.449, Regret: 0.3527, Entropy: 0.1204 +[2026-01-29T22:07:29.213374Z] Loop 2120: Loss: 4.13e-03, Avg Return: 0.438, Regret: 0.3562, Entropy: 0.1207 +[2026-01-29T22:07:30.374951Z] Loop 2121: Loss: 3.81e-03, Avg Return: 0.449, Regret: 0.3562, Entropy: 0.1167 +[2026-01-29T22:07:31.535468Z] Loop 2122: Loss: 3.40e-03, Avg Return: 0.446, Regret: 0.3562, Entropy: 0.1168 +[2026-01-29T22:07:32.696183Z] Loop 2123: Loss: 3.17e-03, Avg Return: 0.454, Regret: 0.3562, Entropy: 0.1085 +[2026-01-29T22:07:33.856105Z] Loop 2124: Loss: 3.01e-03, Avg Return: 0.456, Regret: 0.3562, Entropy: 0.1131 +[2026-01-29T22:07:35.017299Z] Loop 2125: Loss: 2.74e-03, Avg Return: 0.449, Regret: 0.3562, Entropy: 0.1124 +[2026-01-29T22:07:36.179345Z] Loop 2126: Loss: 2.50e-03, Avg Return: 0.449, Regret: 0.3562, Entropy: 0.1178 +[2026-01-29T22:07:37.339222Z] Loop 2127: Loss: 2.58e-03, Avg Return: 0.447, Regret: 0.3562, Entropy: 0.1182 +[2026-01-29T22:07:38.501042Z] Loop 2128: Loss: 2.74e-03, Avg Return: 0.451, Regret: 0.3562, Entropy: 0.1199 +[2026-01-29T22:07:39.661214Z] Loop 2129: Loss: 2.76e-03, Avg Return: 0.451, Regret: 0.3562, Entropy: 0.1217 +[2026-01-29T22:07:40.869409Z] Loop 2130: Loss: 2.58e-03, Avg Return: 0.452, Regret: 0.3516, Entropy: 0.1154 +[2026-01-29T22:07:42.032727Z] Loop 2131: Loss: 2.40e-03, Avg Return: 0.450, Regret: 0.3516, Entropy: 0.1240 +[2026-01-29T22:07:43.192881Z] Loop 2132: Loss: 2.40e-03, Avg Return: 0.454, Regret: 0.3516, Entropy: 0.1194 +[2026-01-29T22:07:44.352400Z] Loop 2133: Loss: 2.24e-03, Avg Return: 0.459, Regret: 0.3516, Entropy: 0.1133 +[2026-01-29T22:07:45.512666Z] Loop 2134: Loss: 2.42e-03, Avg Return: 0.447, Regret: 0.3516, Entropy: 0.1189 +[2026-01-29T22:07:46.673934Z] Loop 2135: Loss: 2.45e-03, Avg Return: 0.454, Regret: 0.3516, Entropy: 0.1211 +[2026-01-29T22:07:47.834911Z] Loop 2136: Loss: 2.73e-03, Avg Return: 0.447, Regret: 0.3516, Entropy: 0.1262 +[2026-01-29T22:07:48.996922Z] Loop 2137: Loss: 2.58e-03, Avg Return: 0.449, Regret: 0.3516, Entropy: 0.1264 +[2026-01-29T22:07:50.157876Z] Loop 2138: Loss: 2.77e-03, Avg Return: 0.457, Regret: 0.3516, Entropy: 0.1142 +[2026-01-29T22:07:51.319650Z] Loop 2139: Loss: 2.57e-03, Avg Return: 0.455, Regret: 0.3516, Entropy: 0.1207 +[2026-01-29T22:07:52.533092Z] Loop 2140: Loss: 2.77e-03, Avg Return: 0.458, Regret: 0.3515, Entropy: 0.1186 +[2026-01-29T22:07:53.697867Z] Loop 2141: Loss: 2.75e-03, Avg Return: 0.452, Regret: 0.3515, Entropy: 0.1196 +[2026-01-29T22:07:54.859415Z] Loop 2142: Loss: 2.81e-03, Avg Return: 0.455, Regret: 0.3515, Entropy: 0.1170 +[2026-01-29T22:07:56.021353Z] Loop 2143: Loss: 2.85e-03, Avg Return: 0.461, Regret: 0.3515, Entropy: 0.1171 +[2026-01-29T22:07:57.184418Z] Loop 2144: Loss: 2.77e-03, Avg Return: 0.451, Regret: 0.3515, Entropy: 0.1178 +[2026-01-29T22:07:58.345400Z] Loop 2145: Loss: 2.56e-03, Avg Return: 0.451, Regret: 0.3515, Entropy: 0.1214 +[2026-01-29T22:07:59.506348Z] Loop 2146: Loss: 2.89e-03, Avg Return: 0.456, Regret: 0.3515, Entropy: 0.1177 +[2026-01-29T22:08:00.667781Z] Loop 2147: Loss: 2.74e-03, Avg Return: 0.453, Regret: 0.3515, Entropy: 0.1162 +[2026-01-29T22:08:01.828054Z] Loop 2148: Loss: 2.89e-03, Avg Return: 0.455, Regret: 0.3515, Entropy: 0.1215 +[2026-01-29T22:08:02.990305Z] Loop 2149: Loss: 2.85e-03, Avg Return: 0.456, Regret: 0.3515, Entropy: 0.1180 +[2026-01-29T22:08:04.198947Z] Loop 2150: Loss: 2.67e-03, Avg Return: 0.455, Regret: 0.3514, Entropy: 0.1216 +[2026-01-29T22:08:05.360538Z] Loop 2151: Loss: 2.70e-03, Avg Return: 0.460, Regret: 0.3514, Entropy: 0.1159 +[2026-01-29T22:08:06.521047Z] Loop 2152: Loss: 2.25e-03, Avg Return: 0.451, Regret: 0.3514, Entropy: 0.1152 +[2026-01-29T22:08:07.682955Z] Loop 2153: Loss: 2.07e-03, Avg Return: 0.458, Regret: 0.3514, Entropy: 0.1174 +[2026-01-29T22:08:08.842759Z] Loop 2154: Loss: 2.15e-03, Avg Return: 0.453, Regret: 0.3514, Entropy: 0.1150 +[2026-01-29T22:08:10.002001Z] Loop 2155: Loss: 2.31e-03, Avg Return: 0.452, Regret: 0.3514, Entropy: 0.1110 +[2026-01-29T22:08:11.160952Z] Loop 2156: Loss: 2.68e-03, Avg Return: 0.449, Regret: 0.3514, Entropy: 0.1200 +[2026-01-29T22:08:12.320350Z] Loop 2157: Loss: 2.48e-03, Avg Return: 0.444, Regret: 0.3514, Entropy: 0.1231 +[2026-01-29T22:08:13.480842Z] Loop 2158: Loss: 2.58e-03, Avg Return: 0.450, Regret: 0.3514, Entropy: 0.1200 +[2026-01-29T22:08:14.640375Z] Loop 2159: Loss: 2.49e-03, Avg Return: 0.445, Regret: 0.3514, Entropy: 0.1199 +[2026-01-29T22:08:15.844698Z] Loop 2160: Loss: 2.57e-03, Avg Return: 0.454, Regret: 0.3515, Entropy: 0.1137 +[2026-01-29T22:08:17.005454Z] Loop 2161: Loss: 2.55e-03, Avg Return: 0.451, Regret: 0.3515, Entropy: 0.1174 +[2026-01-29T22:08:18.166585Z] Loop 2162: Loss: 2.47e-03, Avg Return: 0.451, Regret: 0.3515, Entropy: 0.1153 +[2026-01-29T22:08:19.325281Z] Loop 2163: Loss: 2.32e-03, Avg Return: 0.450, Regret: 0.3515, Entropy: 0.1202 +[2026-01-29T22:08:20.485448Z] Loop 2164: Loss: 2.61e-03, Avg Return: 0.455, Regret: 0.3515, Entropy: 0.1157 +[2026-01-29T22:08:21.645362Z] Loop 2165: Loss: 2.69e-03, Avg Return: 0.448, Regret: 0.3515, Entropy: 0.1185 +[2026-01-29T22:08:22.805077Z] Loop 2166: Loss: 2.85e-03, Avg Return: 0.450, Regret: 0.3515, Entropy: 0.1169 +[2026-01-29T22:08:23.966916Z] Loop 2167: Loss: 2.63e-03, Avg Return: 0.449, Regret: 0.3515, Entropy: 0.1108 +[2026-01-29T22:08:25.126122Z] Loop 2168: Loss: 3.05e-03, Avg Return: 0.451, Regret: 0.3515, Entropy: 0.1180 +[2026-01-29T22:08:26.287754Z] Loop 2169: Loss: 2.85e-03, Avg Return: 0.456, Regret: 0.3515, Entropy: 0.1164 +[2026-01-29T22:08:27.495326Z] Loop 2170: Loss: 2.93e-03, Avg Return: 0.450, Regret: 0.3518, Entropy: 0.1170 +[2026-01-29T22:08:28.659390Z] Loop 2171: Loss: 3.06e-03, Avg Return: 0.456, Regret: 0.3518, Entropy: 0.1145 +[2026-01-29T22:08:29.819465Z] Loop 2172: Loss: 2.96e-03, Avg Return: 0.443, Regret: 0.3518, Entropy: 0.1184 +[2026-01-29T22:08:30.989145Z] Loop 2173: Loss: 3.25e-03, Avg Return: 0.461, Regret: 0.3518, Entropy: 0.1111 +[2026-01-29T22:08:32.156103Z] Loop 2174: Loss: 3.28e-03, Avg Return: 0.447, Regret: 0.3518, Entropy: 0.1173 +[2026-01-29T22:08:33.323301Z] Loop 2175: Loss: 3.23e-03, Avg Return: 0.456, Regret: 0.3518, Entropy: 0.1107 +[2026-01-29T22:08:34.485572Z] Loop 2176: Loss: 3.14e-03, Avg Return: 0.459, Regret: 0.3518, Entropy: 0.1179 +[2026-01-29T22:08:35.645570Z] Loop 2177: Loss: 2.91e-03, Avg Return: 0.445, Regret: 0.3518, Entropy: 0.1111 +[2026-01-29T22:08:36.806437Z] Loop 2178: Loss: 3.25e-03, Avg Return: 0.449, Regret: 0.3518, Entropy: 0.1197 +[2026-01-29T22:08:37.967904Z] Loop 2179: Loss: 3.52e-03, Avg Return: 0.455, Regret: 0.3518, Entropy: 0.1245 +[2026-01-29T22:08:39.193411Z] Loop 2180: Loss: 3.03e-03, Avg Return: 0.448, Regret: 0.3523, Entropy: 0.1171 +[2026-01-29T22:08:40.359055Z] Loop 2181: Loss: 2.88e-03, Avg Return: 0.452, Regret: 0.3523, Entropy: 0.1206 +[2026-01-29T22:08:41.521074Z] Loop 2182: Loss: 3.15e-03, Avg Return: 0.454, Regret: 0.3523, Entropy: 0.1197 +[2026-01-29T22:08:42.683518Z] Loop 2183: Loss: 2.86e-03, Avg Return: 0.459, Regret: 0.3523, Entropy: 0.1200 +[2026-01-29T22:08:43.849855Z] Loop 2184: Loss: 3.10e-03, Avg Return: 0.451, Regret: 0.3523, Entropy: 0.1147 +[2026-01-29T22:08:45.010984Z] Loop 2185: Loss: 2.73e-03, Avg Return: 0.449, Regret: 0.3523, Entropy: 0.1269 +[2026-01-29T22:08:46.171337Z] Loop 2186: Loss: 2.71e-03, Avg Return: 0.452, Regret: 0.3523, Entropy: 0.1209 +[2026-01-29T22:08:47.330769Z] Loop 2187: Loss: 2.33e-03, Avg Return: 0.452, Regret: 0.3523, Entropy: 0.1162 +[2026-01-29T22:08:48.491837Z] Loop 2188: Loss: 2.31e-03, Avg Return: 0.453, Regret: 0.3523, Entropy: 0.1210 +[2026-01-29T22:08:49.653179Z] Loop 2189: Loss: 2.50e-03, Avg Return: 0.451, Regret: 0.3523, Entropy: 0.1174 +[2026-01-29T22:08:50.867998Z] Loop 2190: Loss: 2.63e-03, Avg Return: 0.455, Regret: 0.3514, Entropy: 0.1178 +[2026-01-29T22:08:52.032198Z] Loop 2191: Loss: 2.29e-03, Avg Return: 0.449, Regret: 0.3514, Entropy: 0.1137 +[2026-01-29T22:08:53.192657Z] Loop 2192: Loss: 2.27e-03, Avg Return: 0.446, Regret: 0.3514, Entropy: 0.1119 +[2026-01-29T22:08:54.354261Z] Loop 2193: Loss: 2.10e-03, Avg Return: 0.451, Regret: 0.3514, Entropy: 0.1016 +[2026-01-29T22:08:55.514493Z] Loop 2194: Loss: 1.88e-03, Avg Return: 0.451, Regret: 0.3514, Entropy: 0.1057 +[2026-01-29T22:08:56.674663Z] Loop 2195: Loss: 1.87e-03, Avg Return: 0.446, Regret: 0.3514, Entropy: 0.1080 +[2026-01-29T22:08:57.836798Z] Loop 2196: Loss: 2.12e-03, Avg Return: 0.458, Regret: 0.3514, Entropy: 0.1049 +[2026-01-29T22:08:58.997040Z] Loop 2197: Loss: 2.43e-03, Avg Return: 0.448, Regret: 0.3514, Entropy: 0.1074 +[2026-01-29T22:09:00.158971Z] Loop 2198: Loss: 2.52e-03, Avg Return: 0.451, Regret: 0.3514, Entropy: 0.1108 +[2026-01-29T22:09:01.320823Z] Loop 2199: Loss: 2.78e-03, Avg Return: 0.449, Regret: 0.3514, Entropy: 0.1172 +[2026-01-29T22:09:02.533686Z] Loop 2200: Loss: 2.72e-03, Avg Return: 0.451, Regret: 0.3536, Entropy: 0.1113 +[2026-01-29T22:09:03.696655Z] Loop 2201: Loss: 2.99e-03, Avg Return: 0.449, Regret: 0.3536, Entropy: 0.1167 +[2026-01-29T22:09:04.859408Z] Loop 2202: Loss: 2.65e-03, Avg Return: 0.448, Regret: 0.3536, Entropy: 0.1170 +[2026-01-29T22:09:06.026570Z] Loop 2203: Loss: 2.52e-03, Avg Return: 0.454, Regret: 0.3536, Entropy: 0.1118 +[2026-01-29T22:09:07.187242Z] Loop 2204: Loss: 2.56e-03, Avg Return: 0.450, Regret: 0.3536, Entropy: 0.1118 +[2026-01-29T22:09:08.348827Z] Loop 2205: Loss: 2.43e-03, Avg Return: 0.447, Regret: 0.3536, Entropy: 0.1123 +[2026-01-29T22:09:09.508774Z] Loop 2206: Loss: 2.75e-03, Avg Return: 0.457, Regret: 0.3536, Entropy: 0.1155 +[2026-01-29T22:09:10.670398Z] Loop 2207: Loss: 3.13e-03, Avg Return: 0.453, Regret: 0.3536, Entropy: 0.1132 +[2026-01-29T22:09:11.832301Z] Loop 2208: Loss: 3.05e-03, Avg Return: 0.452, Regret: 0.3536, Entropy: 0.1136 +[2026-01-29T22:09:12.993655Z] Loop 2209: Loss: 2.67e-03, Avg Return: 0.448, Regret: 0.3536, Entropy: 0.1161 +[2026-01-29T22:09:14.202196Z] Loop 2210: Loss: 2.22e-03, Avg Return: 0.454, Regret: 0.3517, Entropy: 0.1116 +[2026-01-29T22:09:15.363977Z] Loop 2211: Loss: 2.07e-03, Avg Return: 0.447, Regret: 0.3517, Entropy: 0.1044 +[2026-01-29T22:09:16.525611Z] Loop 2212: Loss: 1.97e-03, Avg Return: 0.453, Regret: 0.3517, Entropy: 0.1072 +[2026-01-29T22:09:17.685748Z] Loop 2213: Loss: 1.90e-03, Avg Return: 0.451, Regret: 0.3517, Entropy: 0.1125 +[2026-01-29T22:09:18.847119Z] Loop 2214: Loss: 2.25e-03, Avg Return: 0.455, Regret: 0.3517, Entropy: 0.1109 +[2026-01-29T22:09:20.012809Z] Loop 2215: Loss: 2.53e-03, Avg Return: 0.455, Regret: 0.3517, Entropy: 0.1240 +[2026-01-29T22:09:21.174239Z] Loop 2216: Loss: 2.75e-03, Avg Return: 0.454, Regret: 0.3517, Entropy: 0.1272 +[2026-01-29T22:09:22.335556Z] Loop 2217: Loss: 2.88e-03, Avg Return: 0.450, Regret: 0.3517, Entropy: 0.1301 +[2026-01-29T22:09:23.496329Z] Loop 2218: Loss: 2.98e-03, Avg Return: 0.446, Regret: 0.3517, Entropy: 0.1296 +[2026-01-29T22:09:24.659902Z] Loop 2219: Loss: 3.64e-03, Avg Return: 0.462, Regret: 0.3517, Entropy: 0.1309 +[2026-01-29T22:09:25.869115Z] Loop 2220: Loss: 3.44e-03, Avg Return: 0.448, Regret: 0.3527, Entropy: 0.1293 +[2026-01-29T22:09:27.032052Z] Loop 2221: Loss: 3.10e-03, Avg Return: 0.445, Regret: 0.3527, Entropy: 0.1243 +[2026-01-29T22:09:28.193844Z] Loop 2222: Loss: 3.35e-03, Avg Return: 0.449, Regret: 0.3527, Entropy: 0.1241 +[2026-01-29T22:09:29.354214Z] Loop 2223: Loss: 3.50e-03, Avg Return: 0.454, Regret: 0.3527, Entropy: 0.1187 +[2026-01-29T22:09:30.514934Z] Loop 2224: Loss: 3.14e-03, Avg Return: 0.453, Regret: 0.3527, Entropy: 0.1219 +[2026-01-29T22:09:31.676442Z] Loop 2225: Loss: 2.63e-03, Avg Return: 0.451, Regret: 0.3527, Entropy: 0.1224 +[2026-01-29T22:09:32.837704Z] Loop 2226: Loss: 2.77e-03, Avg Return: 0.451, Regret: 0.3527, Entropy: 0.1255 +[2026-01-29T22:09:33.998638Z] Loop 2227: Loss: 2.83e-03, Avg Return: 0.456, Regret: 0.3527, Entropy: 0.1226 +[2026-01-29T22:09:35.159368Z] Loop 2228: Loss: 2.97e-03, Avg Return: 0.454, Regret: 0.3527, Entropy: 0.1248 +[2026-01-29T22:09:36.319447Z] Loop 2229: Loss: 2.52e-03, Avg Return: 0.449, Regret: 0.3527, Entropy: 0.1257 +[2026-01-29T22:09:37.529218Z] Loop 2230: Loss: 3.00e-03, Avg Return: 0.451, Regret: 0.3516, Entropy: 0.1234 +[2026-01-29T22:09:38.695472Z] Loop 2231: Loss: 2.62e-03, Avg Return: 0.451, Regret: 0.3516, Entropy: 0.1241 +[2026-01-29T22:09:39.856095Z] Loop 2232: Loss: 2.94e-03, Avg Return: 0.447, Regret: 0.3516, Entropy: 0.1309 +[2026-01-29T22:09:41.017785Z] Loop 2233: Loss: 2.47e-03, Avg Return: 0.453, Regret: 0.3516, Entropy: 0.1236 +[2026-01-29T22:09:42.178516Z] Loop 2234: Loss: 2.90e-03, Avg Return: 0.456, Regret: 0.3516, Entropy: 0.1246 +[2026-01-29T22:09:43.340944Z] Loop 2235: Loss: 2.72e-03, Avg Return: 0.452, Regret: 0.3516, Entropy: 0.1229 +[2026-01-29T22:09:44.500867Z] Loop 2236: Loss: 2.70e-03, Avg Return: 0.454, Regret: 0.3516, Entropy: 0.1169 +[2026-01-29T22:09:45.662243Z] Loop 2237: Loss: 2.79e-03, Avg Return: 0.451, Regret: 0.3516, Entropy: 0.1198 +[2026-01-29T22:09:46.827861Z] Loop 2238: Loss: 2.30e-03, Avg Return: 0.450, Regret: 0.3516, Entropy: 0.1199 +[2026-01-29T22:09:47.989151Z] Loop 2239: Loss: 2.04e-03, Avg Return: 0.454, Regret: 0.3516, Entropy: 0.1150 +[2026-01-29T22:09:49.201462Z] Loop 2240: Loss: 1.98e-03, Avg Return: 0.446, Regret: 0.3513, Entropy: 0.1067 +[2026-01-29T22:09:50.362484Z] Loop 2241: Loss: 2.10e-03, Avg Return: 0.447, Regret: 0.3513, Entropy: 0.1117 +[2026-01-29T22:09:51.523955Z] Loop 2242: Loss: 1.78e-03, Avg Return: 0.444, Regret: 0.3513, Entropy: 0.1111 +[2026-01-29T22:09:52.685933Z] Loop 2243: Loss: 1.95e-03, Avg Return: 0.459, Regret: 0.3513, Entropy: 0.1070 +[2026-01-29T22:09:53.848537Z] Loop 2244: Loss: 2.25e-03, Avg Return: 0.444, Regret: 0.3513, Entropy: 0.1129 +[2026-01-29T22:09:55.011516Z] Loop 2245: Loss: 2.44e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.1183 +[2026-01-29T22:09:56.173014Z] Loop 2246: Loss: 2.36e-03, Avg Return: 0.455, Regret: 0.3513, Entropy: 0.1169 +[2026-01-29T22:09:57.335331Z] Loop 2247: Loss: 2.60e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.1196 +[2026-01-29T22:09:58.496062Z] Loop 2248: Loss: 2.45e-03, Avg Return: 0.447, Regret: 0.3513, Entropy: 0.1161 +[2026-01-29T22:09:59.657063Z] Loop 2249: Loss: 2.42e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.1183 +[2026-01-29T22:10:00.864304Z] Loop 2250: Loss: 2.73e-03, Avg Return: 0.444, Regret: 0.3518, Entropy: 0.1184 +[2026-01-29T22:10:02.024691Z] Loop 2251: Loss: 2.53e-03, Avg Return: 0.452, Regret: 0.3518, Entropy: 0.1170 +[2026-01-29T22:10:03.184045Z] Loop 2252: Loss: 2.70e-03, Avg Return: 0.458, Regret: 0.3518, Entropy: 0.1142 +[2026-01-29T22:10:04.343704Z] Loop 2253: Loss: 2.88e-03, Avg Return: 0.456, Regret: 0.3518, Entropy: 0.1135 +[2026-01-29T22:10:05.503816Z] Loop 2254: Loss: 3.12e-03, Avg Return: 0.456, Regret: 0.3518, Entropy: 0.1149 +[2026-01-29T22:10:06.663365Z] Loop 2255: Loss: 2.84e-03, Avg Return: 0.457, Regret: 0.3518, Entropy: 0.1251 +[2026-01-29T22:10:07.823860Z] Loop 2256: Loss: 2.44e-03, Avg Return: 0.455, Regret: 0.3518, Entropy: 0.1151 +[2026-01-29T22:10:08.982758Z] Loop 2257: Loss: 2.42e-03, Avg Return: 0.450, Regret: 0.3518, Entropy: 0.1126 +[2026-01-29T22:10:10.144188Z] Loop 2258: Loss: 2.44e-03, Avg Return: 0.457, Regret: 0.3518, Entropy: 0.1093 +[2026-01-29T22:10:11.303472Z] Loop 2259: Loss: 2.29e-03, Avg Return: 0.452, Regret: 0.3518, Entropy: 0.1162 +[2026-01-29T22:10:12.507833Z] Loop 2260: Loss: 2.68e-03, Avg Return: 0.458, Regret: 0.3512, Entropy: 0.1155 +[2026-01-29T22:10:13.669416Z] Loop 2261: Loss: 2.20e-03, Avg Return: 0.453, Regret: 0.3512, Entropy: 0.1100 +[2026-01-29T22:10:14.830349Z] Loop 2262: Loss: 2.02e-03, Avg Return: 0.454, Regret: 0.3512, Entropy: 0.1056 +[2026-01-29T22:10:15.989037Z] Loop 2263: Loss: 1.91e-03, Avg Return: 0.446, Regret: 0.3512, Entropy: 0.1034 +[2026-01-29T22:10:17.148437Z] Loop 2264: Loss: 1.71e-03, Avg Return: 0.454, Regret: 0.3512, Entropy: 0.1099 +[2026-01-29T22:10:18.308897Z] Loop 2265: Loss: 2.26e-03, Avg Return: 0.450, Regret: 0.3512, Entropy: 0.1090 +[2026-01-29T22:10:19.469015Z] Loop 2266: Loss: 2.96e-03, Avg Return: 0.458, Regret: 0.3512, Entropy: 0.1176 +[2026-01-29T22:10:20.631442Z] Loop 2267: Loss: 2.49e-03, Avg Return: 0.449, Regret: 0.3512, Entropy: 0.1192 +[2026-01-29T22:10:21.791449Z] Loop 2268: Loss: 2.96e-03, Avg Return: 0.449, Regret: 0.3512, Entropy: 0.1153 +[2026-01-29T22:10:22.951329Z] Loop 2269: Loss: 2.75e-03, Avg Return: 0.453, Regret: 0.3512, Entropy: 0.1218 +[2026-01-29T22:10:24.157154Z] Loop 2270: Loss: 2.83e-03, Avg Return: 0.441, Regret: 0.3533, Entropy: 0.1249 +[2026-01-29T22:10:25.317509Z] Loop 2271: Loss: 2.67e-03, Avg Return: 0.450, Regret: 0.3533, Entropy: 0.1166 +[2026-01-29T22:10:26.476249Z] Loop 2272: Loss: 2.90e-03, Avg Return: 0.460, Regret: 0.3533, Entropy: 0.1164 +[2026-01-29T22:10:27.635955Z] Loop 2273: Loss: 2.91e-03, Avg Return: 0.452, Regret: 0.3533, Entropy: 0.1194 +[2026-01-29T22:10:28.795235Z] Loop 2274: Loss: 2.64e-03, Avg Return: 0.449, Regret: 0.3533, Entropy: 0.1153 +[2026-01-29T22:10:29.956820Z] Loop 2275: Loss: 2.50e-03, Avg Return: 0.447, Regret: 0.3533, Entropy: 0.1190 +[2026-01-29T22:10:31.120824Z] Loop 2276: Loss: 2.26e-03, Avg Return: 0.457, Regret: 0.3533, Entropy: 0.1135 +[2026-01-29T22:10:32.280098Z] Loop 2277: Loss: 2.61e-03, Avg Return: 0.455, Regret: 0.3533, Entropy: 0.1142 +[2026-01-29T22:10:33.442489Z] Loop 2278: Loss: 2.58e-03, Avg Return: 0.448, Regret: 0.3533, Entropy: 0.1096 +[2026-01-29T22:10:34.608111Z] Loop 2279: Loss: 2.82e-03, Avg Return: 0.458, Regret: 0.3533, Entropy: 0.1128 +[2026-01-29T22:10:35.825793Z] Loop 2280: Loss: 2.68e-03, Avg Return: 0.460, Regret: 0.3518, Entropy: 0.1133 +[2026-01-29T22:10:36.996628Z] Loop 2281: Loss: 2.48e-03, Avg Return: 0.453, Regret: 0.3518, Entropy: 0.1112 +[2026-01-29T22:10:38.155806Z] Loop 2282: Loss: 2.62e-03, Avg Return: 0.447, Regret: 0.3518, Entropy: 0.1111 +[2026-01-29T22:10:39.317393Z] Loop 2283: Loss: 2.47e-03, Avg Return: 0.449, Regret: 0.3518, Entropy: 0.1184 +[2026-01-29T22:10:40.478209Z] Loop 2284: Loss: 2.09e-03, Avg Return: 0.450, Regret: 0.3518, Entropy: 0.1117 +[2026-01-29T22:10:41.639403Z] Loop 2285: Loss: 2.22e-03, Avg Return: 0.459, Regret: 0.3518, Entropy: 0.1066 +[2026-01-29T22:10:42.800936Z] Loop 2286: Loss: 2.27e-03, Avg Return: 0.453, Regret: 0.3518, Entropy: 0.1131 +[2026-01-29T22:10:43.961107Z] Loop 2287: Loss: 1.87e-03, Avg Return: 0.456, Regret: 0.3518, Entropy: 0.1114 +[2026-01-29T22:10:45.122040Z] Loop 2288: Loss: 2.02e-03, Avg Return: 0.450, Regret: 0.3518, Entropy: 0.1074 +[2026-01-29T22:10:46.281878Z] Loop 2289: Loss: 2.20e-03, Avg Return: 0.451, Regret: 0.3518, Entropy: 0.1197 +[2026-01-29T22:10:47.488289Z] Loop 2290: Loss: 2.45e-03, Avg Return: 0.449, Regret: 0.3511, Entropy: 0.1201 +[2026-01-29T22:10:48.647811Z] Loop 2291: Loss: 2.73e-03, Avg Return: 0.447, Regret: 0.3511, Entropy: 0.1192 +[2026-01-29T22:10:49.809423Z] Loop 2292: Loss: 2.78e-03, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.1205 +[2026-01-29T22:10:50.970284Z] Loop 2293: Loss: 2.62e-03, Avg Return: 0.446, Regret: 0.3511, Entropy: 0.1231 +[2026-01-29T22:10:52.131955Z] Loop 2294: Loss: 2.80e-03, Avg Return: 0.453, Regret: 0.3511, Entropy: 0.1193 +[2026-01-29T22:10:53.293937Z] Loop 2295: Loss: 2.71e-03, Avg Return: 0.457, Regret: 0.3511, Entropy: 0.1191 +[2026-01-29T22:10:54.454081Z] Loop 2296: Loss: 3.16e-03, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.1205 +[2026-01-29T22:10:55.614692Z] Loop 2297: Loss: 3.29e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.1204 +[2026-01-29T22:10:56.774645Z] Loop 2298: Loss: 3.29e-03, Avg Return: 0.449, Regret: 0.3511, Entropy: 0.1169 +[2026-01-29T22:10:57.934558Z] Loop 2299: Loss: 3.70e-03, Avg Return: 0.458, Regret: 0.3511, Entropy: 0.1125 +[2026-01-29T22:10:59.140534Z] Loop 2300: Loss: 3.69e-03, Avg Return: 0.445, Regret: 0.3546, Entropy: 0.1172 +[2026-01-29T22:11:00.310654Z] Loop 2301: Loss: 3.60e-03, Avg Return: 0.450, Regret: 0.3546, Entropy: 0.1165 +[2026-01-29T22:11:01.473315Z] Loop 2302: Loss: 3.61e-03, Avg Return: 0.449, Regret: 0.3546, Entropy: 0.1127 +[2026-01-29T22:11:02.633757Z] Loop 2303: Loss: 3.94e-03, Avg Return: 0.453, Regret: 0.3546, Entropy: 0.1086 +[2026-01-29T22:11:03.795084Z] Loop 2304: Loss: 3.74e-03, Avg Return: 0.445, Regret: 0.3546, Entropy: 0.1104 +[2026-01-29T22:11:04.955415Z] Loop 2305: Loss: 3.93e-03, Avg Return: 0.444, Regret: 0.3546, Entropy: 0.1104 +[2026-01-29T22:11:06.120407Z] Loop 2306: Loss: 3.81e-03, Avg Return: 0.451, Regret: 0.3546, Entropy: 0.1059 +[2026-01-29T22:11:07.286998Z] Loop 2307: Loss: 3.75e-03, Avg Return: 0.454, Regret: 0.3546, Entropy: 0.1107 +[2026-01-29T22:11:08.448664Z] Loop 2308: Loss: 3.31e-03, Avg Return: 0.447, Regret: 0.3546, Entropy: 0.1092 +[2026-01-29T22:11:09.610001Z] Loop 2309: Loss: 3.16e-03, Avg Return: 0.449, Regret: 0.3546, Entropy: 0.1036 +[2026-01-29T22:11:10.818240Z] Loop 2310: Loss: 2.89e-03, Avg Return: 0.452, Regret: 0.3525, Entropy: 0.1072 +[2026-01-29T22:11:11.985653Z] Loop 2311: Loss: 3.07e-03, Avg Return: 0.457, Regret: 0.3525, Entropy: 0.1031 +[2026-01-29T22:11:13.146326Z] Loop 2312: Loss: 2.77e-03, Avg Return: 0.454, Regret: 0.3525, Entropy: 0.1047 +[2026-01-29T22:11:14.312878Z] Loop 2313: Loss: 2.18e-03, Avg Return: 0.444, Regret: 0.3525, Entropy: 0.1038 +[2026-01-29T22:11:15.475151Z] Loop 2314: Loss: 2.31e-03, Avg Return: 0.449, Regret: 0.3525, Entropy: 0.0967 +[2026-01-29T22:11:16.636824Z] Loop 2315: Loss: 2.32e-03, Avg Return: 0.455, Regret: 0.3525, Entropy: 0.0955 +[2026-01-29T22:11:17.804629Z] Loop 2316: Loss: 2.16e-03, Avg Return: 0.452, Regret: 0.3525, Entropy: 0.1002 +[2026-01-29T22:11:18.964274Z] Loop 2317: Loss: 2.01e-03, Avg Return: 0.452, Regret: 0.3525, Entropy: 0.0990 +[2026-01-29T22:11:20.124951Z] Loop 2318: Loss: 2.09e-03, Avg Return: 0.452, Regret: 0.3525, Entropy: 0.0975 +[2026-01-29T22:11:21.284751Z] Loop 2319: Loss: 2.11e-03, Avg Return: 0.452, Regret: 0.3525, Entropy: 0.1033 +[2026-01-29T22:11:22.497777Z] Loop 2320: Loss: 1.89e-03, Avg Return: 0.458, Regret: 0.3521, Entropy: 0.0926 +[2026-01-29T22:11:23.664179Z] Loop 2321: Loss: 1.97e-03, Avg Return: 0.453, Regret: 0.3521, Entropy: 0.0961 +[2026-01-29T22:11:24.826478Z] Loop 2322: Loss: 1.88e-03, Avg Return: 0.441, Regret: 0.3521, Entropy: 0.1025 +[2026-01-29T22:11:25.988945Z] Loop 2323: Loss: 1.92e-03, Avg Return: 0.451, Regret: 0.3521, Entropy: 0.0978 +[2026-01-29T22:11:27.149496Z] Loop 2324: Loss: 1.99e-03, Avg Return: 0.450, Regret: 0.3521, Entropy: 0.0941 +[2026-01-29T22:11:28.311559Z] Loop 2325: Loss: 2.01e-03, Avg Return: 0.457, Regret: 0.3521, Entropy: 0.0966 +[2026-01-29T22:11:29.474708Z] Loop 2326: Loss: 2.00e-03, Avg Return: 0.451, Regret: 0.3521, Entropy: 0.0972 +[2026-01-29T22:11:30.634115Z] Loop 2327: Loss: 1.87e-03, Avg Return: 0.450, Regret: 0.3521, Entropy: 0.0996 +[2026-01-29T22:11:31.795675Z] Loop 2328: Loss: 1.72e-03, Avg Return: 0.451, Regret: 0.3521, Entropy: 0.1042 +[2026-01-29T22:11:32.956202Z] Loop 2329: Loss: 2.12e-03, Avg Return: 0.451, Regret: 0.3521, Entropy: 0.1024 +[2026-01-29T22:11:34.164388Z] Loop 2330: Loss: 2.22e-03, Avg Return: 0.458, Regret: 0.3527, Entropy: 0.1021 +[2026-01-29T22:11:35.323445Z] Loop 2331: Loss: 1.72e-03, Avg Return: 0.448, Regret: 0.3527, Entropy: 0.0977 +[2026-01-29T22:11:36.484427Z] Loop 2332: Loss: 1.86e-03, Avg Return: 0.448, Regret: 0.3527, Entropy: 0.0980 +[2026-01-29T22:11:37.643749Z] Loop 2333: Loss: 2.01e-03, Avg Return: 0.450, Regret: 0.3527, Entropy: 0.0963 +[2026-01-29T22:11:38.804949Z] Loop 2334: Loss: 1.82e-03, Avg Return: 0.451, Regret: 0.3527, Entropy: 0.1003 +[2026-01-29T22:11:39.965110Z] Loop 2335: Loss: 1.68e-03, Avg Return: 0.456, Regret: 0.3527, Entropy: 0.0926 +[2026-01-29T22:11:41.125511Z] Loop 2336: Loss: 1.69e-03, Avg Return: 0.455, Regret: 0.3527, Entropy: 0.1036 +[2026-01-29T22:11:42.286255Z] Loop 2337: Loss: 1.76e-03, Avg Return: 0.456, Regret: 0.3527, Entropy: 0.1010 +[2026-01-29T22:11:43.445671Z] Loop 2338: Loss: 1.92e-03, Avg Return: 0.460, Regret: 0.3527, Entropy: 0.0978 +[2026-01-29T22:11:44.606680Z] Loop 2339: Loss: 1.73e-03, Avg Return: 0.448, Regret: 0.3527, Entropy: 0.0982 +[2026-01-29T22:11:45.814880Z] Loop 2340: Loss: 1.84e-03, Avg Return: 0.451, Regret: 0.3523, Entropy: 0.1023 +[2026-01-29T22:11:46.977344Z] Loop 2341: Loss: 1.80e-03, Avg Return: 0.449, Regret: 0.3523, Entropy: 0.1013 +[2026-01-29T22:11:48.139086Z] Loop 2342: Loss: 1.99e-03, Avg Return: 0.455, Regret: 0.3523, Entropy: 0.1005 +[2026-01-29T22:11:49.300892Z] Loop 2343: Loss: 2.02e-03, Avg Return: 0.450, Regret: 0.3523, Entropy: 0.1027 +[2026-01-29T22:11:50.460984Z] Loop 2344: Loss: 2.10e-03, Avg Return: 0.458, Regret: 0.3523, Entropy: 0.1023 +[2026-01-29T22:11:51.622004Z] Loop 2345: Loss: 2.16e-03, Avg Return: 0.446, Regret: 0.3523, Entropy: 0.1060 +[2026-01-29T22:11:52.783878Z] Loop 2346: Loss: 2.18e-03, Avg Return: 0.454, Regret: 0.3523, Entropy: 0.1090 +[2026-01-29T22:11:53.943705Z] Loop 2347: Loss: 1.89e-03, Avg Return: 0.453, Regret: 0.3523, Entropy: 0.1082 +[2026-01-29T22:11:55.104335Z] Loop 2348: Loss: 1.94e-03, Avg Return: 0.447, Regret: 0.3523, Entropy: 0.1059 +[2026-01-29T22:11:56.263920Z] Loop 2349: Loss: 2.05e-03, Avg Return: 0.450, Regret: 0.3523, Entropy: 0.1023 +[2026-01-29T22:11:57.474284Z] Loop 2350: Loss: 2.07e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.1025 +[2026-01-29T22:11:58.637083Z] Loop 2351: Loss: 2.68e-03, Avg Return: 0.447, Regret: 0.3513, Entropy: 0.0942 +[2026-01-29T22:11:59.800766Z] Loop 2352: Loss: 2.51e-03, Avg Return: 0.452, Regret: 0.3513, Entropy: 0.0991 +[2026-01-29T22:12:00.960247Z] Loop 2353: Loss: 3.03e-03, Avg Return: 0.449, Regret: 0.3513, Entropy: 0.1049 +[2026-01-29T22:12:02.122597Z] Loop 2354: Loss: 3.29e-03, Avg Return: 0.455, Regret: 0.3513, Entropy: 0.1007 +[2026-01-29T22:12:03.285329Z] Loop 2355: Loss: 3.73e-03, Avg Return: 0.457, Regret: 0.3513, Entropy: 0.1066 +[2026-01-29T22:12:04.444928Z] Loop 2356: Loss: 3.63e-03, Avg Return: 0.454, Regret: 0.3513, Entropy: 0.1038 +[2026-01-29T22:12:05.606296Z] Loop 2357: Loss: 3.43e-03, Avg Return: 0.458, Regret: 0.3513, Entropy: 0.1030 +[2026-01-29T22:12:06.766403Z] Loop 2358: Loss: 3.62e-03, Avg Return: 0.456, Regret: 0.3513, Entropy: 0.1134 +[2026-01-29T22:12:07.926570Z] Loop 2359: Loss: 3.68e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.1135 +[2026-01-29T22:12:09.137070Z] Loop 2360: Loss: 3.46e-03, Avg Return: 0.450, Regret: 0.3521, Entropy: 0.1066 +[2026-01-29T22:12:10.299440Z] Loop 2361: Loss: 3.12e-03, Avg Return: 0.451, Regret: 0.3521, Entropy: 0.1137 +[2026-01-29T22:12:11.461436Z] Loop 2362: Loss: 2.79e-03, Avg Return: 0.455, Regret: 0.3521, Entropy: 0.1060 +[2026-01-29T22:12:12.622310Z] Loop 2363: Loss: 2.29e-03, Avg Return: 0.453, Regret: 0.3521, Entropy: 0.1085 +[2026-01-29T22:12:13.784981Z] Loop 2364: Loss: 2.27e-03, Avg Return: 0.449, Regret: 0.3521, Entropy: 0.1032 +[2026-01-29T22:12:14.944482Z] Loop 2365: Loss: 2.57e-03, Avg Return: 0.450, Regret: 0.3521, Entropy: 0.1075 +[2026-01-29T22:12:16.104721Z] Loop 2366: Loss: 2.16e-03, Avg Return: 0.452, Regret: 0.3521, Entropy: 0.1110 +[2026-01-29T22:12:17.265196Z] Loop 2367: Loss: 2.16e-03, Avg Return: 0.454, Regret: 0.3521, Entropy: 0.1049 +[2026-01-29T22:12:18.425894Z] Loop 2368: Loss: 1.96e-03, Avg Return: 0.452, Regret: 0.3521, Entropy: 0.0988 +[2026-01-29T22:12:19.586706Z] Loop 2369: Loss: 1.64e-03, Avg Return: 0.452, Regret: 0.3521, Entropy: 0.1008 +[2026-01-29T22:12:20.790800Z] Loop 2370: Loss: 1.59e-03, Avg Return: 0.450, Regret: 0.3512, Entropy: 0.1018 +[2026-01-29T22:12:21.957931Z] Loop 2371: Loss: 1.70e-03, Avg Return: 0.453, Regret: 0.3512, Entropy: 0.0931 +[2026-01-29T22:12:23.118876Z] Loop 2372: Loss: 1.63e-03, Avg Return: 0.448, Regret: 0.3512, Entropy: 0.1018 +[2026-01-29T22:12:24.281260Z] Loop 2373: Loss: 2.25e-03, Avg Return: 0.448, Regret: 0.3512, Entropy: 0.1054 +[2026-01-29T22:12:25.442620Z] Loop 2374: Loss: 2.77e-03, Avg Return: 0.458, Regret: 0.3512, Entropy: 0.1090 +[2026-01-29T22:12:26.604419Z] Loop 2375: Loss: 3.42e-03, Avg Return: 0.451, Regret: 0.3512, Entropy: 0.1210 +[2026-01-29T22:12:27.765470Z] Loop 2376: Loss: 3.15e-03, Avg Return: 0.444, Regret: 0.3512, Entropy: 0.1118 +[2026-01-29T22:12:28.927190Z] Loop 2377: Loss: 3.06e-03, Avg Return: 0.446, Regret: 0.3512, Entropy: 0.1005 +[2026-01-29T22:12:30.089598Z] Loop 2378: Loss: 3.24e-03, Avg Return: 0.439, Regret: 0.3512, Entropy: 0.0999 +[2026-01-29T22:12:31.250053Z] Loop 2379: Loss: 2.66e-03, Avg Return: 0.446, Regret: 0.3512, Entropy: 0.1079 +[2026-01-29T22:12:32.456299Z] Loop 2380: Loss: 2.42e-03, Avg Return: 0.457, Regret: 0.3552, Entropy: 0.1047 +[2026-01-29T22:12:33.617476Z] Loop 2381: Loss: 3.12e-03, Avg Return: 0.454, Regret: 0.3552, Entropy: 0.1172 +[2026-01-29T22:12:34.777739Z] Loop 2382: Loss: 3.21e-03, Avg Return: 0.455, Regret: 0.3552, Entropy: 0.1227 +[2026-01-29T22:12:35.937276Z] Loop 2383: Loss: 2.87e-03, Avg Return: 0.449, Regret: 0.3552, Entropy: 0.1276 +[2026-01-29T22:12:37.096368Z] Loop 2384: Loss: 2.67e-03, Avg Return: 0.448, Regret: 0.3552, Entropy: 0.1179 +[2026-01-29T22:12:38.255596Z] Loop 2385: Loss: 1.98e-03, Avg Return: 0.453, Regret: 0.3552, Entropy: 0.1091 +[2026-01-29T22:12:39.414862Z] Loop 2386: Loss: 1.73e-03, Avg Return: 0.450, Regret: 0.3552, Entropy: 0.1155 +[2026-01-29T22:12:40.574717Z] Loop 2387: Loss: 1.88e-03, Avg Return: 0.450, Regret: 0.3552, Entropy: 0.1071 +[2026-01-29T22:12:41.733839Z] Loop 2388: Loss: 1.78e-03, Avg Return: 0.452, Regret: 0.3552, Entropy: 0.1116 +[2026-01-29T22:12:42.894385Z] Loop 2389: Loss: 1.65e-03, Avg Return: 0.452, Regret: 0.3552, Entropy: 0.1116 +[2026-01-29T22:12:44.096873Z] Loop 2390: Loss: 1.76e-03, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.1143 +[2026-01-29T22:12:45.257557Z] Loop 2391: Loss: 1.85e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.1127 +[2026-01-29T22:12:46.417300Z] Loop 2392: Loss: 1.87e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.1217 +[2026-01-29T22:12:47.577339Z] Loop 2393: Loss: 2.15e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.1197 +[2026-01-29T22:12:48.736766Z] Loop 2394: Loss: 2.32e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.1166 +[2026-01-29T22:12:49.897527Z] Loop 2395: Loss: 2.28e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.1133 +[2026-01-29T22:12:51.056882Z] Loop 2396: Loss: 2.20e-03, Avg Return: 0.447, Regret: 0.3511, Entropy: 0.1218 +[2026-01-29T22:12:52.216627Z] Loop 2397: Loss: 2.52e-03, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.1143 +[2026-01-29T22:12:53.375634Z] Loop 2398: Loss: 2.33e-03, Avg Return: 0.447, Regret: 0.3511, Entropy: 0.1121 +[2026-01-29T22:12:54.536112Z] Loop 2399: Loss: 2.69e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.1144 +[2026-01-29T22:12:55.741323Z] Loop 2400: Loss: 2.51e-03, Avg Return: 0.450, Regret: 0.3521, Entropy: 0.1136 +[2026-01-29T22:12:56.901867Z] Loop 2401: Loss: 2.39e-03, Avg Return: 0.444, Regret: 0.3521, Entropy: 0.1100 +[2026-01-29T22:12:58.061973Z] Loop 2402: Loss: 2.34e-03, Avg Return: 0.450, Regret: 0.3521, Entropy: 0.1163 +[2026-01-29T22:12:59.222489Z] Loop 2403: Loss: 2.23e-03, Avg Return: 0.448, Regret: 0.3521, Entropy: 0.1111 +[2026-01-29T22:13:00.387190Z] Loop 2404: Loss: 1.91e-03, Avg Return: 0.453, Regret: 0.3521, Entropy: 0.1052 +[2026-01-29T22:13:01.553459Z] Loop 2405: Loss: 2.09e-03, Avg Return: 0.454, Regret: 0.3521, Entropy: 0.1122 +[2026-01-29T22:13:02.713862Z] Loop 2406: Loss: 1.60e-03, Avg Return: 0.459, Regret: 0.3521, Entropy: 0.1058 +[2026-01-29T22:13:03.872986Z] Loop 2407: Loss: 1.79e-03, Avg Return: 0.456, Regret: 0.3521, Entropy: 0.1030 +[2026-01-29T22:13:05.033119Z] Loop 2408: Loss: 2.05e-03, Avg Return: 0.454, Regret: 0.3521, Entropy: 0.1138 +[2026-01-29T22:13:06.194145Z] Loop 2409: Loss: 2.38e-03, Avg Return: 0.449, Regret: 0.3521, Entropy: 0.1273 +[2026-01-29T22:13:07.398476Z] Loop 2410: Loss: 3.15e-03, Avg Return: 0.454, Regret: 0.3520, Entropy: 0.1313 +[2026-01-29T22:13:08.560036Z] Loop 2411: Loss: 3.14e-03, Avg Return: 0.457, Regret: 0.3520, Entropy: 0.1355 +[2026-01-29T22:13:09.720552Z] Loop 2412: Loss: 2.92e-03, Avg Return: 0.449, Regret: 0.3520, Entropy: 0.1367 +[2026-01-29T22:13:10.881041Z] Loop 2413: Loss: 2.86e-03, Avg Return: 0.448, Regret: 0.3520, Entropy: 0.1214 +[2026-01-29T22:13:12.040649Z] Loop 2414: Loss: 2.60e-03, Avg Return: 0.455, Regret: 0.3520, Entropy: 0.1190 +[2026-01-29T22:13:13.202214Z] Loop 2415: Loss: 2.33e-03, Avg Return: 0.453, Regret: 0.3520, Entropy: 0.1115 +[2026-01-29T22:13:14.367068Z] Loop 2416: Loss: 2.03e-03, Avg Return: 0.445, Regret: 0.3520, Entropy: 0.1110 +[2026-01-29T22:13:15.527303Z] Loop 2417: Loss: 2.06e-03, Avg Return: 0.442, Regret: 0.3520, Entropy: 0.1052 +[2026-01-29T22:13:16.689187Z] Loop 2418: Loss: 1.76e-03, Avg Return: 0.444, Regret: 0.3520, Entropy: 0.1073 +[2026-01-29T22:13:17.848686Z] Loop 2419: Loss: 2.18e-03, Avg Return: 0.451, Regret: 0.3520, Entropy: 0.1007 +[2026-01-29T22:13:19.056620Z] Loop 2420: Loss: 1.70e-03, Avg Return: 0.443, Regret: 0.3546, Entropy: 0.1101 +[2026-01-29T22:13:20.218343Z] Loop 2421: Loss: 2.01e-03, Avg Return: 0.449, Regret: 0.3546, Entropy: 0.1092 +[2026-01-29T22:13:21.380162Z] Loop 2422: Loss: 2.11e-03, Avg Return: 0.453, Regret: 0.3546, Entropy: 0.1107 +[2026-01-29T22:13:22.540788Z] Loop 2423: Loss: 2.31e-03, Avg Return: 0.446, Regret: 0.3546, Entropy: 0.1141 +[2026-01-29T22:13:23.702544Z] Loop 2424: Loss: 2.60e-03, Avg Return: 0.453, Regret: 0.3546, Entropy: 0.1103 +[2026-01-29T22:13:24.864763Z] Loop 2425: Loss: 2.59e-03, Avg Return: 0.453, Regret: 0.3546, Entropy: 0.1156 +[2026-01-29T22:13:26.025184Z] Loop 2426: Loss: 2.64e-03, Avg Return: 0.448, Regret: 0.3546, Entropy: 0.1128 +[2026-01-29T22:13:27.186366Z] Loop 2427: Loss: 2.14e-03, Avg Return: 0.443, Regret: 0.3546, Entropy: 0.1100 +[2026-01-29T22:13:28.346624Z] Loop 2428: Loss: 2.14e-03, Avg Return: 0.450, Regret: 0.3546, Entropy: 0.1113 +[2026-01-29T22:13:29.507592Z] Loop 2429: Loss: 2.60e-03, Avg Return: 0.459, Regret: 0.3546, Entropy: 0.1097 +[2026-01-29T22:13:30.713406Z] Loop 2430: Loss: 2.74e-03, Avg Return: 0.460, Regret: 0.3525, Entropy: 0.1096 +[2026-01-29T22:13:31.874290Z] Loop 2431: Loss: 2.19e-03, Avg Return: 0.456, Regret: 0.3525, Entropy: 0.1124 +[2026-01-29T22:13:33.034450Z] Loop 2432: Loss: 2.24e-03, Avg Return: 0.448, Regret: 0.3525, Entropy: 0.1094 +[2026-01-29T22:13:34.195485Z] Loop 2433: Loss: 2.12e-03, Avg Return: 0.449, Regret: 0.3525, Entropy: 0.1082 +[2026-01-29T22:13:35.355421Z] Loop 2434: Loss: 2.25e-03, Avg Return: 0.453, Regret: 0.3525, Entropy: 0.1124 +[2026-01-29T22:13:36.515937Z] Loop 2435: Loss: 2.24e-03, Avg Return: 0.450, Regret: 0.3525, Entropy: 0.1093 +[2026-01-29T22:13:37.677268Z] Loop 2436: Loss: 2.12e-03, Avg Return: 0.449, Regret: 0.3525, Entropy: 0.1107 +[2026-01-29T22:13:38.837978Z] Loop 2437: Loss: 2.40e-03, Avg Return: 0.453, Regret: 0.3525, Entropy: 0.1133 +[2026-01-29T22:13:39.999708Z] Loop 2438: Loss: 2.40e-03, Avg Return: 0.449, Regret: 0.3525, Entropy: 0.1108 +[2026-01-29T22:13:41.159794Z] Loop 2439: Loss: 2.43e-03, Avg Return: 0.448, Regret: 0.3525, Entropy: 0.1188 +[2026-01-29T22:13:42.365915Z] Loop 2440: Loss: 2.58e-03, Avg Return: 0.456, Regret: 0.3517, Entropy: 0.1098 +[2026-01-29T22:13:43.525823Z] Loop 2441: Loss: 2.70e-03, Avg Return: 0.447, Regret: 0.3517, Entropy: 0.1226 +[2026-01-29T22:13:44.687073Z] Loop 2442: Loss: 2.78e-03, Avg Return: 0.453, Regret: 0.3517, Entropy: 0.1156 +[2026-01-29T22:13:45.846725Z] Loop 2443: Loss: 2.85e-03, Avg Return: 0.452, Regret: 0.3517, Entropy: 0.1232 +[2026-01-29T22:13:47.007188Z] Loop 2444: Loss: 2.86e-03, Avg Return: 0.450, Regret: 0.3517, Entropy: 0.1185 +[2026-01-29T22:13:48.166833Z] Loop 2445: Loss: 2.99e-03, Avg Return: 0.451, Regret: 0.3517, Entropy: 0.1274 +[2026-01-29T22:13:49.326839Z] Loop 2446: Loss: 2.78e-03, Avg Return: 0.442, Regret: 0.3517, Entropy: 0.1234 +[2026-01-29T22:13:50.487758Z] Loop 2447: Loss: 2.95e-03, Avg Return: 0.441, Regret: 0.3517, Entropy: 0.1173 +[2026-01-29T22:13:51.647666Z] Loop 2448: Loss: 2.71e-03, Avg Return: 0.455, Regret: 0.3517, Entropy: 0.1193 +[2026-01-29T22:13:52.808616Z] Loop 2449: Loss: 2.75e-03, Avg Return: 0.455, Regret: 0.3517, Entropy: 0.1110 +[2026-01-29T22:13:54.014290Z] Loop 2450: Loss: 2.52e-03, Avg Return: 0.450, Regret: 0.3523, Entropy: 0.1115 +[2026-01-29T22:13:55.175505Z] Loop 2451: Loss: 2.41e-03, Avg Return: 0.454, Regret: 0.3523, Entropy: 0.1082 +[2026-01-29T22:13:56.335213Z] Loop 2452: Loss: 2.27e-03, Avg Return: 0.448, Regret: 0.3523, Entropy: 0.1046 +[2026-01-29T22:13:57.496198Z] Loop 2453: Loss: 2.16e-03, Avg Return: 0.450, Regret: 0.3523, Entropy: 0.0970 +[2026-01-29T22:13:58.655936Z] Loop 2454: Loss: 2.04e-03, Avg Return: 0.449, Regret: 0.3523, Entropy: 0.0927 +[2026-01-29T22:13:59.816346Z] Loop 2455: Loss: 2.07e-03, Avg Return: 0.438, Regret: 0.3523, Entropy: 0.1002 +[2026-01-29T22:14:00.978029Z] Loop 2456: Loss: 2.26e-03, Avg Return: 0.446, Regret: 0.3523, Entropy: 0.1049 +[2026-01-29T22:14:02.138493Z] Loop 2457: Loss: 2.03e-03, Avg Return: 0.456, Regret: 0.3523, Entropy: 0.0968 +[2026-01-29T22:14:03.299683Z] Loop 2458: Loss: 2.27e-03, Avg Return: 0.459, Regret: 0.3523, Entropy: 0.0957 +[2026-01-29T22:14:04.459475Z] Loop 2459: Loss: 2.50e-03, Avg Return: 0.458, Regret: 0.3523, Entropy: 0.1041 +[2026-01-29T22:14:05.673130Z] Loop 2460: Loss: 2.63e-03, Avg Return: 0.444, Regret: 0.3537, Entropy: 0.1091 +[2026-01-29T22:14:06.833965Z] Loop 2461: Loss: 2.63e-03, Avg Return: 0.443, Regret: 0.3537, Entropy: 0.1183 +[2026-01-29T22:14:07.995339Z] Loop 2462: Loss: 2.98e-03, Avg Return: 0.443, Regret: 0.3537, Entropy: 0.1231 +[2026-01-29T22:14:09.155337Z] Loop 2463: Loss: 3.28e-03, Avg Return: 0.452, Regret: 0.3537, Entropy: 0.1320 +[2026-01-29T22:14:10.316449Z] Loop 2464: Loss: 3.55e-03, Avg Return: 0.451, Regret: 0.3537, Entropy: 0.1361 +[2026-01-29T22:14:11.477717Z] Loop 2465: Loss: 3.56e-03, Avg Return: 0.450, Regret: 0.3537, Entropy: 0.1400 +[2026-01-29T22:14:12.637728Z] Loop 2466: Loss: 3.57e-03, Avg Return: 0.453, Regret: 0.3537, Entropy: 0.1305 +[2026-01-29T22:14:13.798908Z] Loop 2467: Loss: 2.99e-03, Avg Return: 0.454, Regret: 0.3537, Entropy: 0.1241 +[2026-01-29T22:14:14.959255Z] Loop 2468: Loss: 2.57e-03, Avg Return: 0.448, Regret: 0.3537, Entropy: 0.1157 +[2026-01-29T22:14:16.121057Z] Loop 2469: Loss: 2.56e-03, Avg Return: 0.452, Regret: 0.3537, Entropy: 0.1199 +[2026-01-29T22:14:17.329170Z] Loop 2470: Loss: 2.56e-03, Avg Return: 0.451, Regret: 0.3515, Entropy: 0.1086 +[2026-01-29T22:14:18.491310Z] Loop 2471: Loss: 2.73e-03, Avg Return: 0.454, Regret: 0.3515, Entropy: 0.1169 +[2026-01-29T22:14:19.650903Z] Loop 2472: Loss: 3.05e-03, Avg Return: 0.450, Regret: 0.3515, Entropy: 0.1251 +[2026-01-29T22:14:20.811035Z] Loop 2473: Loss: 3.03e-03, Avg Return: 0.458, Regret: 0.3515, Entropy: 0.1255 +[2026-01-29T22:14:21.971530Z] Loop 2474: Loss: 3.33e-03, Avg Return: 0.454, Regret: 0.3515, Entropy: 0.1289 +[2026-01-29T22:14:23.131168Z] Loop 2475: Loss: 3.21e-03, Avg Return: 0.450, Regret: 0.3515, Entropy: 0.1329 +[2026-01-29T22:14:24.292719Z] Loop 2476: Loss: 3.24e-03, Avg Return: 0.464, Regret: 0.3515, Entropy: 0.1258 +[2026-01-29T22:14:25.452968Z] Loop 2477: Loss: 2.75e-03, Avg Return: 0.451, Regret: 0.3515, Entropy: 0.1269 +[2026-01-29T22:14:26.613995Z] Loop 2478: Loss: 2.43e-03, Avg Return: 0.455, Regret: 0.3515, Entropy: 0.1141 +[2026-01-29T22:14:27.773432Z] Loop 2479: Loss: 2.46e-03, Avg Return: 0.451, Regret: 0.3515, Entropy: 0.1160 +[2026-01-29T22:14:28.979537Z] Loop 2480: Loss: 2.23e-03, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.1119 +[2026-01-29T22:14:30.140888Z] Loop 2481: Loss: 2.42e-03, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.1152 +[2026-01-29T22:14:31.301500Z] Loop 2482: Loss: 2.36e-03, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.1078 +[2026-01-29T22:14:32.462899Z] Loop 2483: Loss: 2.06e-03, Avg Return: 0.451, Regret: 0.3510, Entropy: 0.1070 +[2026-01-29T22:14:33.623216Z] Loop 2484: Loss: 2.09e-03, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.1068 +[2026-01-29T22:14:34.784763Z] Loop 2485: Loss: 2.06e-03, Avg Return: 0.454, Regret: 0.3510, Entropy: 0.1074 +[2026-01-29T22:14:35.944878Z] Loop 2486: Loss: 2.52e-03, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.1030 +[2026-01-29T22:14:37.106038Z] Loop 2487: Loss: 2.65e-03, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.1123 +[2026-01-29T22:14:38.266039Z] Loop 2488: Loss: 2.90e-03, Avg Return: 0.448, Regret: 0.3510, Entropy: 0.1146 +[2026-01-29T22:14:39.426222Z] Loop 2489: Loss: 2.63e-03, Avg Return: 0.449, Regret: 0.3510, Entropy: 0.1027 +[2026-01-29T22:14:40.634707Z] Loop 2490: Loss: 2.45e-03, Avg Return: 0.451, Regret: 0.3512, Entropy: 0.1078 +[2026-01-29T22:14:41.795139Z] Loop 2491: Loss: 2.75e-03, Avg Return: 0.458, Regret: 0.3512, Entropy: 0.1077 +[2026-01-29T22:14:42.955247Z] Loop 2492: Loss: 2.83e-03, Avg Return: 0.452, Regret: 0.3512, Entropy: 0.1036 +[2026-01-29T22:14:44.115855Z] Loop 2493: Loss: 2.71e-03, Avg Return: 0.448, Regret: 0.3512, Entropy: 0.1021 +[2026-01-29T22:14:45.277340Z] Loop 2494: Loss: 2.78e-03, Avg Return: 0.458, Regret: 0.3512, Entropy: 0.0998 +[2026-01-29T22:14:46.437427Z] Loop 2495: Loss: 2.54e-03, Avg Return: 0.450, Regret: 0.3512, Entropy: 0.0913 +[2026-01-29T22:14:47.598632Z] Loop 2496: Loss: 2.43e-03, Avg Return: 0.456, Regret: 0.3512, Entropy: 0.0901 +[2026-01-29T22:14:48.758699Z] Loop 2497: Loss: 2.30e-03, Avg Return: 0.452, Regret: 0.3512, Entropy: 0.0869 +[2026-01-29T22:14:49.919527Z] Loop 2498: Loss: 2.20e-03, Avg Return: 0.450, Regret: 0.3512, Entropy: 0.0845 +[2026-01-29T22:14:51.080881Z] Loop 2499: Loss: 2.23e-03, Avg Return: 0.454, Regret: 0.3512, Entropy: 0.0828 +[2026-01-29T22:14:52.286362Z] Loop 2500: Loss: 2.40e-03, Avg Return: 0.445, Regret: 0.3520, Entropy: 0.0838 +[2026-01-29T22:14:53.447203Z] Loop 2501: Loss: 2.30e-03, Avg Return: 0.443, Regret: 0.3520, Entropy: 0.0834 +[2026-01-29T22:14:54.608515Z] Loop 2502: Loss: 2.29e-03, Avg Return: 0.454, Regret: 0.3520, Entropy: 0.0792 +[2026-01-29T22:14:55.769107Z] Loop 2503: Loss: 2.10e-03, Avg Return: 0.453, Regret: 0.3520, Entropy: 0.0790 +[2026-01-29T22:14:56.930286Z] Loop 2504: Loss: 2.08e-03, Avg Return: 0.454, Regret: 0.3520, Entropy: 0.0778 +[2026-01-29T22:14:58.092063Z] Loop 2505: Loss: 2.42e-03, Avg Return: 0.456, Regret: 0.3520, Entropy: 0.0829 +[2026-01-29T22:14:59.252611Z] Loop 2506: Loss: 2.12e-03, Avg Return: 0.451, Regret: 0.3520, Entropy: 0.0859 +[2026-01-29T22:15:00.413376Z] Loop 2507: Loss: 2.25e-03, Avg Return: 0.464, Regret: 0.3520, Entropy: 0.0907 +[2026-01-29T22:15:01.574849Z] Loop 2508: Loss: 2.07e-03, Avg Return: 0.456, Regret: 0.3520, Entropy: 0.0966 +[2026-01-29T22:15:02.735229Z] Loop 2509: Loss: 1.94e-03, Avg Return: 0.450, Regret: 0.3520, Entropy: 0.0965 +[2026-01-29T22:15:03.942384Z] Loop 2510: Loss: 2.14e-03, Avg Return: 0.449, Regret: 0.3511, Entropy: 0.0974 +[2026-01-29T22:15:05.107134Z] Loop 2511: Loss: 1.83e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0926 +[2026-01-29T22:15:06.269074Z] Loop 2512: Loss: 1.60e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0946 +[2026-01-29T22:15:07.430657Z] Loop 2513: Loss: 1.54e-03, Avg Return: 0.449, Regret: 0.3511, Entropy: 0.0908 +[2026-01-29T22:15:08.593455Z] Loop 2514: Loss: 1.21e-03, Avg Return: 0.441, Regret: 0.3511, Entropy: 0.0910 +[2026-01-29T22:15:09.753735Z] Loop 2515: Loss: 1.67e-03, Avg Return: 0.449, Regret: 0.3511, Entropy: 0.0941 +[2026-01-29T22:15:10.919133Z] Loop 2516: Loss: 2.06e-03, Avg Return: 0.449, Regret: 0.3511, Entropy: 0.1017 +[2026-01-29T22:15:12.082641Z] Loop 2517: Loss: 2.89e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.1074 +[2026-01-29T22:15:13.244672Z] Loop 2518: Loss: 2.89e-03, Avg Return: 0.443, Regret: 0.3511, Entropy: 0.1124 +[2026-01-29T22:15:14.407136Z] Loop 2519: Loss: 2.88e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.1097 +[2026-01-29T22:15:15.619352Z] Loop 2520: Loss: 2.78e-03, Avg Return: 0.452, Regret: 0.3548, Entropy: 0.1168 +[2026-01-29T22:15:16.780616Z] Loop 2521: Loss: 2.65e-03, Avg Return: 0.446, Regret: 0.3548, Entropy: 0.1144 +[2026-01-29T22:15:17.940500Z] Loop 2522: Loss: 2.93e-03, Avg Return: 0.455, Regret: 0.3548, Entropy: 0.1044 +[2026-01-29T22:15:19.100119Z] Loop 2523: Loss: 2.43e-03, Avg Return: 0.443, Regret: 0.3548, Entropy: 0.1070 +[2026-01-29T22:15:20.259977Z] Loop 2524: Loss: 3.15e-03, Avg Return: 0.460, Regret: 0.3548, Entropy: 0.1105 +[2026-01-29T22:15:21.419394Z] Loop 2525: Loss: 2.72e-03, Avg Return: 0.455, Regret: 0.3548, Entropy: 0.1106 +[2026-01-29T22:15:22.580191Z] Loop 2526: Loss: 2.57e-03, Avg Return: 0.455, Regret: 0.3548, Entropy: 0.1072 +[2026-01-29T22:15:23.740784Z] Loop 2527: Loss: 1.99e-03, Avg Return: 0.457, Regret: 0.3548, Entropy: 0.0967 +[2026-01-29T22:15:24.901996Z] Loop 2528: Loss: 1.32e-03, Avg Return: 0.451, Regret: 0.3548, Entropy: 0.0861 +[2026-01-29T22:15:26.061892Z] Loop 2529: Loss: 1.08e-03, Avg Return: 0.454, Regret: 0.3548, Entropy: 0.0846 +[2026-01-29T22:15:27.268329Z] Loop 2530: Loss: 1.06e-03, Avg Return: 0.451, Regret: 0.3513, Entropy: 0.0806 +[2026-01-29T22:15:28.428886Z] Loop 2531: Loss: 1.34e-03, Avg Return: 0.449, Regret: 0.3513, Entropy: 0.0882 +[2026-01-29T22:15:29.591098Z] Loop 2532: Loss: 1.35e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.0805 +[2026-01-29T22:15:30.751536Z] Loop 2533: Loss: 1.70e-03, Avg Return: 0.452, Regret: 0.3513, Entropy: 0.0891 +[2026-01-29T22:15:31.912413Z] Loop 2534: Loss: 1.70e-03, Avg Return: 0.449, Regret: 0.3513, Entropy: 0.0912 +[2026-01-29T22:15:33.074371Z] Loop 2535: Loss: 2.02e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.0937 +[2026-01-29T22:15:34.235205Z] Loop 2536: Loss: 1.99e-03, Avg Return: 0.455, Regret: 0.3513, Entropy: 0.0933 +[2026-01-29T22:15:35.398247Z] Loop 2537: Loss: 2.37e-03, Avg Return: 0.461, Regret: 0.3513, Entropy: 0.0992 +[2026-01-29T22:15:36.558984Z] Loop 2538: Loss: 2.06e-03, Avg Return: 0.445, Regret: 0.3513, Entropy: 0.0960 +[2026-01-29T22:15:37.719988Z] Loop 2539: Loss: 1.92e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.0905 +[2026-01-29T22:15:38.931085Z] Loop 2540: Loss: 2.30e-03, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0898 +[2026-01-29T22:15:40.095218Z] Loop 2541: Loss: 2.60e-03, Avg Return: 0.459, Regret: 0.3510, Entropy: 0.0891 +[2026-01-29T22:15:41.256473Z] Loop 2542: Loss: 2.90e-03, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0873 +[2026-01-29T22:15:42.416374Z] Loop 2543: Loss: 2.59e-03, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0879 +[2026-01-29T22:15:43.577003Z] Loop 2544: Loss: 2.76e-03, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0878 +[2026-01-29T22:15:44.738238Z] Loop 2545: Loss: 2.80e-03, Avg Return: 0.457, Regret: 0.3510, Entropy: 0.0883 +[2026-01-29T22:15:45.899927Z] Loop 2546: Loss: 2.67e-03, Avg Return: 0.463, Regret: 0.3510, Entropy: 0.0897 +[2026-01-29T22:15:47.061200Z] Loop 2547: Loss: 2.60e-03, Avg Return: 0.451, Regret: 0.3510, Entropy: 0.0887 +[2026-01-29T22:15:48.221694Z] Loop 2548: Loss: 2.73e-03, Avg Return: 0.442, Regret: 0.3510, Entropy: 0.0920 +[2026-01-29T22:15:49.383385Z] Loop 2549: Loss: 2.91e-03, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0954 +[2026-01-29T22:15:50.598917Z] Loop 2550: Loss: 2.70e-03, Avg Return: 0.445, Regret: 0.3513, Entropy: 0.0866 +[2026-01-29T22:15:51.760024Z] Loop 2551: Loss: 2.97e-03, Avg Return: 0.454, Regret: 0.3513, Entropy: 0.0881 +[2026-01-29T22:15:52.920904Z] Loop 2552: Loss: 3.26e-03, Avg Return: 0.459, Regret: 0.3513, Entropy: 0.0875 +[2026-01-29T22:15:54.081781Z] Loop 2553: Loss: 3.19e-03, Avg Return: 0.444, Regret: 0.3513, Entropy: 0.0880 +[2026-01-29T22:15:55.242153Z] Loop 2554: Loss: 3.34e-03, Avg Return: 0.451, Regret: 0.3513, Entropy: 0.0896 +[2026-01-29T22:15:56.402902Z] Loop 2555: Loss: 3.56e-03, Avg Return: 0.449, Regret: 0.3513, Entropy: 0.0952 +[2026-01-29T22:15:57.564220Z] Loop 2556: Loss: 3.99e-03, Avg Return: 0.436, Regret: 0.3513, Entropy: 0.1020 +[2026-01-29T22:15:58.724068Z] Loop 2557: Loss: 4.30e-03, Avg Return: 0.447, Regret: 0.3513, Entropy: 0.1048 +[2026-01-29T22:15:59.885054Z] Loop 2558: Loss: 4.10e-03, Avg Return: 0.442, Regret: 0.3513, Entropy: 0.1039 +[2026-01-29T22:16:01.044965Z] Loop 2559: Loss: 3.02e-03, Avg Return: 0.441, Regret: 0.3513, Entropy: 0.0945 +[2026-01-29T22:16:02.252716Z] Loop 2560: Loss: 3.35e-03, Avg Return: 0.449, Regret: 0.3531, Entropy: 0.0938 +[2026-01-29T22:16:03.413435Z] Loop 2561: Loss: 3.07e-03, Avg Return: 0.453, Regret: 0.3531, Entropy: 0.0984 +[2026-01-29T22:16:04.574659Z] Loop 2562: Loss: 3.06e-03, Avg Return: 0.454, Regret: 0.3531, Entropy: 0.0954 +[2026-01-29T22:16:05.734716Z] Loop 2563: Loss: 2.65e-03, Avg Return: 0.459, Regret: 0.3531, Entropy: 0.0979 +[2026-01-29T22:16:06.895431Z] Loop 2564: Loss: 2.38e-03, Avg Return: 0.456, Regret: 0.3531, Entropy: 0.0946 +[2026-01-29T22:16:08.056662Z] Loop 2565: Loss: 2.02e-03, Avg Return: 0.455, Regret: 0.3531, Entropy: 0.0933 +[2026-01-29T22:16:09.217110Z] Loop 2566: Loss: 1.82e-03, Avg Return: 0.451, Regret: 0.3531, Entropy: 0.0915 +[2026-01-29T22:16:10.378415Z] Loop 2567: Loss: 1.79e-03, Avg Return: 0.455, Regret: 0.3531, Entropy: 0.0847 +[2026-01-29T22:16:11.539897Z] Loop 2568: Loss: 1.66e-03, Avg Return: 0.453, Regret: 0.3531, Entropy: 0.0888 +[2026-01-29T22:16:12.700266Z] Loop 2569: Loss: 1.48e-03, Avg Return: 0.452, Regret: 0.3531, Entropy: 0.0961 +[2026-01-29T22:16:13.908079Z] Loop 2570: Loss: 1.48e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0899 +[2026-01-29T22:16:15.068311Z] Loop 2571: Loss: 1.66e-03, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.0891 +[2026-01-29T22:16:16.228622Z] Loop 2572: Loss: 1.52e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0913 +[2026-01-29T22:16:17.390207Z] Loop 2573: Loss: 1.62e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0880 +[2026-01-29T22:16:18.551823Z] Loop 2574: Loss: 1.71e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0923 +[2026-01-29T22:16:19.712581Z] Loop 2575: Loss: 1.78e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.1000 +[2026-01-29T22:16:20.873532Z] Loop 2576: Loss: 1.96e-03, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.0955 +[2026-01-29T22:16:22.036519Z] Loop 2577: Loss: 1.83e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0917 +[2026-01-29T22:16:23.196682Z] Loop 2578: Loss: 1.64e-03, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.0959 +[2026-01-29T22:16:24.355856Z] Loop 2579: Loss: 1.82e-03, Avg Return: 0.446, Regret: 0.3511, Entropy: 0.0953 +[2026-01-29T22:16:25.564620Z] Loop 2580: Loss: 1.89e-03, Avg Return: 0.453, Regret: 0.3520, Entropy: 0.0957 +[2026-01-29T22:16:26.728262Z] Loop 2581: Loss: 1.74e-03, Avg Return: 0.457, Regret: 0.3520, Entropy: 0.0942 +[2026-01-29T22:16:27.890335Z] Loop 2582: Loss: 1.80e-03, Avg Return: 0.453, Regret: 0.3520, Entropy: 0.0964 +[2026-01-29T22:16:29.052144Z] Loop 2583: Loss: 1.82e-03, Avg Return: 0.449, Regret: 0.3520, Entropy: 0.0927 +[2026-01-29T22:16:30.212891Z] Loop 2584: Loss: 1.71e-03, Avg Return: 0.448, Regret: 0.3520, Entropy: 0.0966 +[2026-01-29T22:16:31.375285Z] Loop 2585: Loss: 1.44e-03, Avg Return: 0.453, Regret: 0.3520, Entropy: 0.0866 +[2026-01-29T22:16:32.537158Z] Loop 2586: Loss: 1.90e-03, Avg Return: 0.453, Regret: 0.3520, Entropy: 0.0947 +[2026-01-29T22:16:33.698404Z] Loop 2587: Loss: 1.96e-03, Avg Return: 0.452, Regret: 0.3520, Entropy: 0.0924 +[2026-01-29T22:16:34.859479Z] Loop 2588: Loss: 1.82e-03, Avg Return: 0.450, Regret: 0.3520, Entropy: 0.0960 +[2026-01-29T22:16:36.019825Z] Loop 2589: Loss: 1.81e-03, Avg Return: 0.459, Regret: 0.3520, Entropy: 0.0859 +[2026-01-29T22:16:37.230306Z] Loop 2590: Loss: 1.58e-03, Avg Return: 0.447, Regret: 0.3512, Entropy: 0.0914 +[2026-01-29T22:16:38.391707Z] Loop 2591: Loss: 1.80e-03, Avg Return: 0.459, Regret: 0.3512, Entropy: 0.0916 +[2026-01-29T22:16:39.553487Z] Loop 2592: Loss: 1.44e-03, Avg Return: 0.455, Regret: 0.3512, Entropy: 0.0928 +[2026-01-29T22:16:40.713365Z] Loop 2593: Loss: 1.72e-03, Avg Return: 0.449, Regret: 0.3512, Entropy: 0.0937 +[2026-01-29T22:16:41.875209Z] Loop 2594: Loss: 1.48e-03, Avg Return: 0.454, Regret: 0.3512, Entropy: 0.0905 +[2026-01-29T22:16:43.036218Z] Loop 2595: Loss: 1.78e-03, Avg Return: 0.459, Regret: 0.3512, Entropy: 0.0931 +[2026-01-29T22:16:44.196699Z] Loop 2596: Loss: 1.99e-03, Avg Return: 0.451, Regret: 0.3512, Entropy: 0.0942 +[2026-01-29T22:16:45.356554Z] Loop 2597: Loss: 1.70e-03, Avg Return: 0.456, Regret: 0.3512, Entropy: 0.0964 +[2026-01-29T22:16:46.516923Z] Loop 2598: Loss: 1.67e-03, Avg Return: 0.460, Regret: 0.3512, Entropy: 0.0936 +[2026-01-29T22:16:47.678476Z] Loop 2599: Loss: 1.83e-03, Avg Return: 0.449, Regret: 0.3512, Entropy: 0.0918 +[2026-01-29T22:16:48.885673Z] Loop 2600: Loss: 1.82e-03, Avg Return: 0.449, Regret: 0.3510, Entropy: 0.0930 +[2026-01-29T22:16:50.050224Z] Loop 2601: Loss: 1.95e-03, Avg Return: 0.458, Regret: 0.3510, Entropy: 0.0899 +[2026-01-29T22:16:51.210784Z] Loop 2602: Loss: 1.95e-03, Avg Return: 0.450, Regret: 0.3510, Entropy: 0.0972 +[2026-01-29T22:16:52.372523Z] Loop 2603: Loss: 2.18e-03, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0947 +[2026-01-29T22:16:53.536804Z] Loop 2604: Loss: 2.03e-03, Avg Return: 0.464, Regret: 0.3510, Entropy: 0.1003 +[2026-01-29T22:16:54.699258Z] Loop 2605: Loss: 2.07e-03, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0892 +[2026-01-29T22:16:55.861441Z] Loop 2606: Loss: 2.14e-03, Avg Return: 0.454, Regret: 0.3510, Entropy: 0.0926 +[2026-01-29T22:16:57.021278Z] Loop 2607: Loss: 2.50e-03, Avg Return: 0.450, Regret: 0.3510, Entropy: 0.0961 +[2026-01-29T22:16:58.183681Z] Loop 2608: Loss: 2.61e-03, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.1010 +[2026-01-29T22:16:59.345430Z] Loop 2609: Loss: 2.98e-03, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0951 +[2026-01-29T22:17:00.560258Z] Loop 2610: Loss: 2.51e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.0963 +[2026-01-29T22:17:01.722040Z] Loop 2611: Loss: 2.33e-03, Avg Return: 0.456, Regret: 0.3513, Entropy: 0.0912 +[2026-01-29T22:17:02.883017Z] Loop 2612: Loss: 2.04e-03, Avg Return: 0.459, Regret: 0.3513, Entropy: 0.0881 +[2026-01-29T22:17:04.044561Z] Loop 2613: Loss: 1.80e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.0890 +[2026-01-29T22:17:05.204542Z] Loop 2614: Loss: 1.83e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.0900 +[2026-01-29T22:17:06.365771Z] Loop 2615: Loss: 1.81e-03, Avg Return: 0.455, Regret: 0.3513, Entropy: 0.0848 +[2026-01-29T22:17:07.525688Z] Loop 2616: Loss: 1.63e-03, Avg Return: 0.462, Regret: 0.3513, Entropy: 0.0855 +[2026-01-29T22:17:08.690457Z] Loop 2617: Loss: 1.71e-03, Avg Return: 0.452, Regret: 0.3513, Entropy: 0.0886 +[2026-01-29T22:17:09.851903Z] Loop 2618: Loss: 1.83e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.0915 +[2026-01-29T22:17:11.012549Z] Loop 2619: Loss: 1.86e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.0992 +[2026-01-29T22:17:12.221615Z] Loop 2620: Loss: 1.80e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.0925 +[2026-01-29T22:17:13.382891Z] Loop 2621: Loss: 1.47e-03, Avg Return: 0.458, Regret: 0.3513, Entropy: 0.0942 +[2026-01-29T22:17:14.543954Z] Loop 2622: Loss: 1.60e-03, Avg Return: 0.454, Regret: 0.3513, Entropy: 0.0861 +[2026-01-29T22:17:15.702991Z] Loop 2623: Loss: 1.49e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.0891 +[2026-01-29T22:17:16.863904Z] Loop 2624: Loss: 1.53e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.0878 +[2026-01-29T22:17:18.023573Z] Loop 2625: Loss: 1.75e-03, Avg Return: 0.449, Regret: 0.3513, Entropy: 0.0865 +[2026-01-29T22:17:19.184142Z] Loop 2626: Loss: 1.77e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.0789 +[2026-01-29T22:17:20.344355Z] Loop 2627: Loss: 1.66e-03, Avg Return: 0.455, Regret: 0.3513, Entropy: 0.0810 +[2026-01-29T22:17:21.504398Z] Loop 2628: Loss: 1.57e-03, Avg Return: 0.454, Regret: 0.3513, Entropy: 0.0792 +[2026-01-29T22:17:22.665498Z] Loop 2629: Loss: 1.63e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.0830 +[2026-01-29T22:17:23.870711Z] Loop 2630: Loss: 1.64e-03, Avg Return: 0.450, Regret: 0.3516, Entropy: 0.0809 +[2026-01-29T22:17:25.034679Z] Loop 2631: Loss: 1.67e-03, Avg Return: 0.452, Regret: 0.3516, Entropy: 0.0822 +[2026-01-29T22:17:26.195278Z] Loop 2632: Loss: 1.41e-03, Avg Return: 0.448, Regret: 0.3516, Entropy: 0.0824 +[2026-01-29T22:17:27.355977Z] Loop 2633: Loss: 1.42e-03, Avg Return: 0.456, Regret: 0.3516, Entropy: 0.0751 +[2026-01-29T22:17:28.516761Z] Loop 2634: Loss: 1.25e-03, Avg Return: 0.453, Regret: 0.3516, Entropy: 0.0885 +[2026-01-29T22:17:29.678105Z] Loop 2635: Loss: 1.44e-03, Avg Return: 0.452, Regret: 0.3516, Entropy: 0.0904 +[2026-01-29T22:17:30.838667Z] Loop 2636: Loss: 1.16e-03, Avg Return: 0.450, Regret: 0.3516, Entropy: 0.0816 +[2026-01-29T22:17:31.997333Z] Loop 2637: Loss: 1.55e-03, Avg Return: 0.450, Regret: 0.3516, Entropy: 0.0877 +[2026-01-29T22:17:33.157884Z] Loop 2638: Loss: 1.45e-03, Avg Return: 0.451, Regret: 0.3516, Entropy: 0.0826 +[2026-01-29T22:17:34.317739Z] Loop 2639: Loss: 1.42e-03, Avg Return: 0.446, Regret: 0.3516, Entropy: 0.0861 +[2026-01-29T22:17:35.525160Z] Loop 2640: Loss: 1.31e-03, Avg Return: 0.447, Regret: 0.3518, Entropy: 0.0787 +[2026-01-29T22:17:36.687845Z] Loop 2641: Loss: 1.30e-03, Avg Return: 0.452, Regret: 0.3518, Entropy: 0.0849 +[2026-01-29T22:17:37.849899Z] Loop 2642: Loss: 1.36e-03, Avg Return: 0.458, Regret: 0.3518, Entropy: 0.0771 +[2026-01-29T22:17:39.010853Z] Loop 2643: Loss: 1.39e-03, Avg Return: 0.448, Regret: 0.3518, Entropy: 0.0843 +[2026-01-29T22:17:40.174468Z] Loop 2644: Loss: 1.51e-03, Avg Return: 0.447, Regret: 0.3518, Entropy: 0.0831 +[2026-01-29T22:17:41.337021Z] Loop 2645: Loss: 1.70e-03, Avg Return: 0.451, Regret: 0.3518, Entropy: 0.0845 +[2026-01-29T22:17:42.497287Z] Loop 2646: Loss: 2.18e-03, Avg Return: 0.453, Regret: 0.3518, Entropy: 0.0783 +[2026-01-29T22:17:43.659715Z] Loop 2647: Loss: 2.18e-03, Avg Return: 0.455, Regret: 0.3518, Entropy: 0.0797 +[2026-01-29T22:17:44.820992Z] Loop 2648: Loss: 2.40e-03, Avg Return: 0.460, Regret: 0.3518, Entropy: 0.0782 +[2026-01-29T22:17:45.983621Z] Loop 2649: Loss: 2.76e-03, Avg Return: 0.452, Regret: 0.3518, Entropy: 0.0791 +[2026-01-29T22:17:47.197398Z] Loop 2650: Loss: 2.71e-03, Avg Return: 0.453, Regret: 0.3516, Entropy: 0.0788 +[2026-01-29T22:17:48.358171Z] Loop 2651: Loss: 3.12e-03, Avg Return: 0.450, Regret: 0.3516, Entropy: 0.0809 +[2026-01-29T22:17:49.518557Z] Loop 2652: Loss: 3.20e-03, Avg Return: 0.449, Regret: 0.3516, Entropy: 0.0849 +[2026-01-29T22:17:50.679846Z] Loop 2653: Loss: 3.25e-03, Avg Return: 0.449, Regret: 0.3516, Entropy: 0.0842 +[2026-01-29T22:17:51.842008Z] Loop 2654: Loss: 3.37e-03, Avg Return: 0.452, Regret: 0.3516, Entropy: 0.0844 +[2026-01-29T22:17:53.002662Z] Loop 2655: Loss: 3.36e-03, Avg Return: 0.452, Regret: 0.3516, Entropy: 0.0818 +[2026-01-29T22:17:54.163959Z] Loop 2656: Loss: 3.36e-03, Avg Return: 0.453, Regret: 0.3516, Entropy: 0.0834 +[2026-01-29T22:17:55.324512Z] Loop 2657: Loss: 2.46e-03, Avg Return: 0.451, Regret: 0.3516, Entropy: 0.0770 +[2026-01-29T22:17:56.486391Z] Loop 2658: Loss: 2.13e-03, Avg Return: 0.450, Regret: 0.3516, Entropy: 0.0717 +[2026-01-29T22:17:57.649459Z] Loop 2659: Loss: 2.02e-03, Avg Return: 0.448, Regret: 0.3516, Entropy: 0.0720 +[2026-01-29T22:17:58.855309Z] Loop 2660: Loss: 2.17e-03, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0813 +[2026-01-29T22:18:00.017097Z] Loop 2661: Loss: 1.59e-03, Avg Return: 0.447, Regret: 0.3510, Entropy: 0.0823 +[2026-01-29T22:18:01.176849Z] Loop 2662: Loss: 1.31e-03, Avg Return: 0.460, Regret: 0.3510, Entropy: 0.0848 +[2026-01-29T22:18:02.336648Z] Loop 2663: Loss: 1.49e-03, Avg Return: 0.445, Regret: 0.3510, Entropy: 0.0820 +[2026-01-29T22:18:03.495963Z] Loop 2664: Loss: 1.85e-03, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.0918 +[2026-01-29T22:18:04.656587Z] Loop 2665: Loss: 1.46e-03, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.0856 +[2026-01-29T22:18:05.815715Z] Loop 2666: Loss: 9.78e-04, Avg Return: 0.447, Regret: 0.3510, Entropy: 0.0793 +[2026-01-29T22:18:06.976043Z] Loop 2667: Loss: 8.68e-04, Avg Return: 0.444, Regret: 0.3510, Entropy: 0.0738 +[2026-01-29T22:18:08.137787Z] Loop 2668: Loss: 9.57e-04, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.0737 +[2026-01-29T22:18:09.298124Z] Loop 2669: Loss: 1.09e-03, Avg Return: 0.454, Regret: 0.3510, Entropy: 0.0786 +[2026-01-29T22:18:10.505314Z] Loop 2670: Loss: 1.38e-03, Avg Return: 0.456, Regret: 0.3539, Entropy: 0.0799 +[2026-01-29T22:18:11.666410Z] Loop 2671: Loss: 1.70e-03, Avg Return: 0.449, Regret: 0.3539, Entropy: 0.0909 +[2026-01-29T22:18:12.831191Z] Loop 2672: Loss: 2.00e-03, Avg Return: 0.446, Regret: 0.3539, Entropy: 0.0892 +[2026-01-29T22:18:13.991823Z] Loop 2673: Loss: 2.00e-03, Avg Return: 0.447, Regret: 0.3539, Entropy: 0.0851 +[2026-01-29T22:18:15.154120Z] Loop 2674: Loss: 1.63e-03, Avg Return: 0.452, Regret: 0.3539, Entropy: 0.0824 +[2026-01-29T22:18:16.314898Z] Loop 2675: Loss: 1.52e-03, Avg Return: 0.450, Regret: 0.3539, Entropy: 0.0872 +[2026-01-29T22:18:17.477276Z] Loop 2676: Loss: 1.64e-03, Avg Return: 0.445, Regret: 0.3539, Entropy: 0.0845 +[2026-01-29T22:18:18.640595Z] Loop 2677: Loss: 1.54e-03, Avg Return: 0.452, Regret: 0.3539, Entropy: 0.0799 +[2026-01-29T22:18:19.801547Z] Loop 2678: Loss: 1.27e-03, Avg Return: 0.447, Regret: 0.3539, Entropy: 0.0854 +[2026-01-29T22:18:20.963112Z] Loop 2679: Loss: 1.42e-03, Avg Return: 0.451, Regret: 0.3539, Entropy: 0.0797 +[2026-01-29T22:18:22.179184Z] Loop 2680: Loss: 1.55e-03, Avg Return: 0.449, Regret: 0.3527, Entropy: 0.0798 +[2026-01-29T22:18:23.340782Z] Loop 2681: Loss: 1.33e-03, Avg Return: 0.452, Regret: 0.3527, Entropy: 0.0790 +[2026-01-29T22:18:24.500989Z] Loop 2682: Loss: 1.14e-03, Avg Return: 0.451, Regret: 0.3527, Entropy: 0.0814 +[2026-01-29T22:18:25.661732Z] Loop 2683: Loss: 1.10e-03, Avg Return: 0.457, Regret: 0.3527, Entropy: 0.0752 +[2026-01-29T22:18:26.822672Z] Loop 2684: Loss: 8.46e-04, Avg Return: 0.453, Regret: 0.3527, Entropy: 0.0786 +[2026-01-29T22:18:27.983504Z] Loop 2685: Loss: 9.88e-04, Avg Return: 0.459, Regret: 0.3527, Entropy: 0.0787 +[2026-01-29T22:18:29.145131Z] Loop 2686: Loss: 1.03e-03, Avg Return: 0.456, Regret: 0.3527, Entropy: 0.0780 +[2026-01-29T22:18:30.305516Z] Loop 2687: Loss: 1.08e-03, Avg Return: 0.450, Regret: 0.3527, Entropy: 0.0778 +[2026-01-29T22:18:31.466607Z] Loop 2688: Loss: 9.54e-04, Avg Return: 0.451, Regret: 0.3527, Entropy: 0.0785 +[2026-01-29T22:18:32.628825Z] Loop 2689: Loss: 1.03e-03, Avg Return: 0.455, Regret: 0.3527, Entropy: 0.0750 +[2026-01-29T22:18:33.834792Z] Loop 2690: Loss: 1.17e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0776 +[2026-01-29T22:18:34.996156Z] Loop 2691: Loss: 1.12e-03, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.0796 +[2026-01-29T22:18:36.157123Z] Loop 2692: Loss: 1.01e-03, Avg Return: 0.448, Regret: 0.3511, Entropy: 0.0802 +[2026-01-29T22:18:37.317406Z] Loop 2693: Loss: 1.06e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0821 +[2026-01-29T22:18:38.477548Z] Loop 2694: Loss: 1.13e-03, Avg Return: 0.458, Regret: 0.3511, Entropy: 0.0801 +[2026-01-29T22:18:39.638849Z] Loop 2695: Loss: 1.17e-03, Avg Return: 0.453, Regret: 0.3511, Entropy: 0.0824 +[2026-01-29T22:18:40.799206Z] Loop 2696: Loss: 1.22e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0829 +[2026-01-29T22:18:41.960652Z] Loop 2697: Loss: 1.06e-03, Avg Return: 0.453, Regret: 0.3511, Entropy: 0.0817 +[2026-01-29T22:18:43.120828Z] Loop 2698: Loss: 1.04e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0811 +[2026-01-29T22:18:44.281638Z] Loop 2699: Loss: 9.99e-04, Avg Return: 0.447, Regret: 0.3511, Entropy: 0.0824 +[2026-01-29T22:18:45.488134Z] Loop 2700: Loss: 1.02e-03, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0817 +[2026-01-29T22:18:46.651798Z] Loop 2701: Loss: 1.03e-03, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0772 +[2026-01-29T22:18:47.810617Z] Loop 2702: Loss: 9.75e-04, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0796 +[2026-01-29T22:18:48.971295Z] Loop 2703: Loss: 1.05e-03, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0796 +[2026-01-29T22:18:50.133039Z] Loop 2704: Loss: 1.00e-03, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.0797 +[2026-01-29T22:18:51.293626Z] Loop 2705: Loss: 1.02e-03, Avg Return: 0.450, Regret: 0.3510, Entropy: 0.0832 +[2026-01-29T22:18:52.454928Z] Loop 2706: Loss: 1.01e-03, Avg Return: 0.451, Regret: 0.3510, Entropy: 0.0820 +[2026-01-29T22:18:53.615219Z] Loop 2707: Loss: 9.82e-04, Avg Return: 0.457, Regret: 0.3510, Entropy: 0.0864 +[2026-01-29T22:18:54.775804Z] Loop 2708: Loss: 1.00e-03, Avg Return: 0.458, Regret: 0.3510, Entropy: 0.0808 +[2026-01-29T22:18:55.936997Z] Loop 2709: Loss: 7.46e-04, Avg Return: 0.450, Regret: 0.3510, Entropy: 0.0791 +[2026-01-29T22:18:57.153140Z] Loop 2710: Loss: 1.05e-03, Avg Return: 0.451, Regret: 0.3510, Entropy: 0.0837 +[2026-01-29T22:18:58.316641Z] Loop 2711: Loss: 1.14e-03, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0830 +[2026-01-29T22:18:59.477490Z] Loop 2712: Loss: 1.00e-03, Avg Return: 0.457, Regret: 0.3510, Entropy: 0.0841 +[2026-01-29T22:19:00.643207Z] Loop 2713: Loss: 1.02e-03, Avg Return: 0.451, Regret: 0.3510, Entropy: 0.0838 +[2026-01-29T22:19:01.802351Z] Loop 2714: Loss: 1.08e-03, Avg Return: 0.450, Regret: 0.3510, Entropy: 0.0825 +[2026-01-29T22:19:02.962336Z] Loop 2715: Loss: 1.38e-03, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0900 +[2026-01-29T22:19:04.123357Z] Loop 2716: Loss: 1.52e-03, Avg Return: 0.461, Regret: 0.3510, Entropy: 0.0822 +[2026-01-29T22:19:05.289372Z] Loop 2717: Loss: 1.58e-03, Avg Return: 0.459, Regret: 0.3510, Entropy: 0.0889 +[2026-01-29T22:19:06.451854Z] Loop 2718: Loss: 1.67e-03, Avg Return: 0.457, Regret: 0.3510, Entropy: 0.0858 +[2026-01-29T22:19:07.612726Z] Loop 2719: Loss: 1.73e-03, Avg Return: 0.446, Regret: 0.3510, Entropy: 0.0986 +[2026-01-29T22:19:08.828429Z] Loop 2720: Loss: 1.89e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0974 +[2026-01-29T22:19:09.991219Z] Loop 2721: Loss: 1.85e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0933 +[2026-01-29T22:19:11.154308Z] Loop 2722: Loss: 2.09e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0969 +[2026-01-29T22:19:12.317421Z] Loop 2723: Loss: 2.22e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0962 +[2026-01-29T22:19:13.478015Z] Loop 2724: Loss: 2.03e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0964 +[2026-01-29T22:19:14.639434Z] Loop 2725: Loss: 2.03e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.1020 +[2026-01-29T22:19:15.799525Z] Loop 2726: Loss: 2.35e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0999 +[2026-01-29T22:19:16.959921Z] Loop 2727: Loss: 2.85e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.1040 +[2026-01-29T22:19:18.121652Z] Loop 2728: Loss: 2.39e-03, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.1051 +[2026-01-29T22:19:19.281812Z] Loop 2729: Loss: 2.49e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0935 +[2026-01-29T22:19:20.489399Z] Loop 2730: Loss: 2.72e-03, Avg Return: 0.448, Regret: 0.3517, Entropy: 0.1045 +[2026-01-29T22:19:21.650655Z] Loop 2731: Loss: 2.30e-03, Avg Return: 0.451, Regret: 0.3517, Entropy: 0.1012 +[2026-01-29T22:19:22.812023Z] Loop 2732: Loss: 2.37e-03, Avg Return: 0.454, Regret: 0.3517, Entropy: 0.1027 +[2026-01-29T22:19:23.972226Z] Loop 2733: Loss: 2.29e-03, Avg Return: 0.452, Regret: 0.3517, Entropy: 0.1036 +[2026-01-29T22:19:25.133630Z] Loop 2734: Loss: 2.28e-03, Avg Return: 0.449, Regret: 0.3517, Entropy: 0.1028 +[2026-01-29T22:19:26.294658Z] Loop 2735: Loss: 2.01e-03, Avg Return: 0.458, Regret: 0.3517, Entropy: 0.0901 +[2026-01-29T22:19:27.456649Z] Loop 2736: Loss: 1.70e-03, Avg Return: 0.455, Regret: 0.3517, Entropy: 0.0928 +[2026-01-29T22:19:28.618520Z] Loop 2737: Loss: 1.80e-03, Avg Return: 0.451, Regret: 0.3517, Entropy: 0.0975 +[2026-01-29T22:19:29.778455Z] Loop 2738: Loss: 1.78e-03, Avg Return: 0.454, Regret: 0.3517, Entropy: 0.0936 +[2026-01-29T22:19:30.940355Z] Loop 2739: Loss: 1.74e-03, Avg Return: 0.444, Regret: 0.3517, Entropy: 0.0977 +[2026-01-29T22:19:32.148286Z] Loop 2740: Loss: 1.90e-03, Avg Return: 0.458, Regret: 0.3508, Entropy: 0.0893 +[2026-01-29T22:19:33.310245Z] Loop 2741: Loss: 1.66e-03, Avg Return: 0.456, Regret: 0.3508, Entropy: 0.0861 +[2026-01-29T22:19:34.471052Z] Loop 2742: Loss: 1.49e-03, Avg Return: 0.448, Regret: 0.3508, Entropy: 0.0922 +[2026-01-29T22:19:35.632134Z] Loop 2743: Loss: 1.56e-03, Avg Return: 0.460, Regret: 0.3508, Entropy: 0.0870 +[2026-01-29T22:19:36.792595Z] Loop 2744: Loss: 1.58e-03, Avg Return: 0.457, Regret: 0.3508, Entropy: 0.0839 +[2026-01-29T22:19:37.956579Z] Loop 2745: Loss: 1.73e-03, Avg Return: 0.462, Regret: 0.3508, Entropy: 0.0861 +[2026-01-29T22:19:39.118565Z] Loop 2746: Loss: 1.54e-03, Avg Return: 0.459, Regret: 0.3508, Entropy: 0.0850 +[2026-01-29T22:19:40.279141Z] Loop 2747: Loss: 1.74e-03, Avg Return: 0.459, Regret: 0.3508, Entropy: 0.0891 +[2026-01-29T22:19:41.441878Z] Loop 2748: Loss: 1.55e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0876 +[2026-01-29T22:19:42.605069Z] Loop 2749: Loss: 1.74e-03, Avg Return: 0.457, Regret: 0.3508, Entropy: 0.0942 +[2026-01-29T22:19:43.820090Z] Loop 2750: Loss: 1.73e-03, Avg Return: 0.450, Regret: 0.3509, Entropy: 0.0916 +[2026-01-29T22:19:44.981265Z] Loop 2751: Loss: 1.66e-03, Avg Return: 0.451, Regret: 0.3509, Entropy: 0.0887 +[2026-01-29T22:19:46.142595Z] Loop 2752: Loss: 1.71e-03, Avg Return: 0.453, Regret: 0.3509, Entropy: 0.0929 +[2026-01-29T22:19:47.305737Z] Loop 2753: Loss: 1.69e-03, Avg Return: 0.456, Regret: 0.3509, Entropy: 0.0926 +[2026-01-29T22:19:48.466962Z] Loop 2754: Loss: 1.76e-03, Avg Return: 0.453, Regret: 0.3509, Entropy: 0.0956 +[2026-01-29T22:19:49.629130Z] Loop 2755: Loss: 1.84e-03, Avg Return: 0.454, Regret: 0.3509, Entropy: 0.0899 +[2026-01-29T22:19:50.789261Z] Loop 2756: Loss: 1.98e-03, Avg Return: 0.459, Regret: 0.3509, Entropy: 0.0919 +[2026-01-29T22:19:51.950592Z] Loop 2757: Loss: 1.97e-03, Avg Return: 0.456, Regret: 0.3509, Entropy: 0.0884 +[2026-01-29T22:19:53.111594Z] Loop 2758: Loss: 1.94e-03, Avg Return: 0.452, Regret: 0.3509, Entropy: 0.0918 +[2026-01-29T22:19:54.271825Z] Loop 2759: Loss: 1.91e-03, Avg Return: 0.453, Regret: 0.3509, Entropy: 0.0941 +[2026-01-29T22:19:55.481298Z] Loop 2760: Loss: 1.85e-03, Avg Return: 0.451, Regret: 0.3509, Entropy: 0.0931 +[2026-01-29T22:19:56.641963Z] Loop 2761: Loss: 1.97e-03, Avg Return: 0.458, Regret: 0.3509, Entropy: 0.0933 +[2026-01-29T22:19:57.803248Z] Loop 2762: Loss: 1.65e-03, Avg Return: 0.455, Regret: 0.3509, Entropy: 0.0926 +[2026-01-29T22:19:58.963003Z] Loop 2763: Loss: 1.83e-03, Avg Return: 0.450, Regret: 0.3509, Entropy: 0.0900 +[2026-01-29T22:20:00.124364Z] Loop 2764: Loss: 1.75e-03, Avg Return: 0.453, Regret: 0.3509, Entropy: 0.0865 +[2026-01-29T22:20:01.290587Z] Loop 2765: Loss: 1.47e-03, Avg Return: 0.457, Regret: 0.3509, Entropy: 0.0899 +[2026-01-29T22:20:02.451763Z] Loop 2766: Loss: 1.43e-03, Avg Return: 0.448, Regret: 0.3509, Entropy: 0.0843 +[2026-01-29T22:20:03.614332Z] Loop 2767: Loss: 1.67e-03, Avg Return: 0.459, Regret: 0.3509, Entropy: 0.0865 +[2026-01-29T22:20:04.774515Z] Loop 2768: Loss: 1.69e-03, Avg Return: 0.457, Regret: 0.3509, Entropy: 0.0900 +[2026-01-29T22:20:05.935424Z] Loop 2769: Loss: 1.61e-03, Avg Return: 0.452, Regret: 0.3509, Entropy: 0.0924 +[2026-01-29T22:20:07.142421Z] Loop 2770: Loss: 1.56e-03, Avg Return: 0.448, Regret: 0.3510, Entropy: 0.0897 +[2026-01-29T22:20:08.304182Z] Loop 2771: Loss: 1.86e-03, Avg Return: 0.451, Regret: 0.3510, Entropy: 0.0897 +[2026-01-29T22:20:09.465539Z] Loop 2772: Loss: 1.68e-03, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0933 +[2026-01-29T22:20:10.625494Z] Loop 2773: Loss: 1.69e-03, Avg Return: 0.459, Regret: 0.3510, Entropy: 0.0878 +[2026-01-29T22:20:11.787129Z] Loop 2774: Loss: 1.74e-03, Avg Return: 0.451, Regret: 0.3510, Entropy: 0.0929 +[2026-01-29T22:20:12.947744Z] Loop 2775: Loss: 1.59e-03, Avg Return: 0.448, Regret: 0.3510, Entropy: 0.0918 +[2026-01-29T22:20:14.109328Z] Loop 2776: Loss: 1.55e-03, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0895 +[2026-01-29T22:20:15.269448Z] Loop 2777: Loss: 1.35e-03, Avg Return: 0.458, Regret: 0.3510, Entropy: 0.0890 +[2026-01-29T22:20:16.430698Z] Loop 2778: Loss: 1.46e-03, Avg Return: 0.454, Regret: 0.3510, Entropy: 0.0893 +[2026-01-29T22:20:17.591176Z] Loop 2779: Loss: 1.54e-03, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0801 +[2026-01-29T22:20:18.800129Z] Loop 2780: Loss: 2.08e-03, Avg Return: 0.450, Regret: 0.3508, Entropy: 0.0845 +[2026-01-29T22:20:19.961381Z] Loop 2781: Loss: 2.12e-03, Avg Return: 0.441, Regret: 0.3508, Entropy: 0.0875 +[2026-01-29T22:20:21.121993Z] Loop 2782: Loss: 2.50e-03, Avg Return: 0.451, Regret: 0.3508, Entropy: 0.0874 +[2026-01-29T22:20:22.281838Z] Loop 2783: Loss: 2.40e-03, Avg Return: 0.454, Regret: 0.3508, Entropy: 0.0828 +[2026-01-29T22:20:23.442668Z] Loop 2784: Loss: 2.18e-03, Avg Return: 0.452, Regret: 0.3508, Entropy: 0.0827 +[2026-01-29T22:20:24.604736Z] Loop 2785: Loss: 2.77e-03, Avg Return: 0.459, Regret: 0.3508, Entropy: 0.0808 +[2026-01-29T22:20:25.764325Z] Loop 2786: Loss: 2.65e-03, Avg Return: 0.450, Regret: 0.3508, Entropy: 0.0806 +[2026-01-29T22:20:26.925545Z] Loop 2787: Loss: 2.29e-03, Avg Return: 0.451, Regret: 0.3508, Entropy: 0.0779 +[2026-01-29T22:20:28.086063Z] Loop 2788: Loss: 2.47e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0761 +[2026-01-29T22:20:29.247279Z] Loop 2789: Loss: 2.28e-03, Avg Return: 0.456, Regret: 0.3508, Entropy: 0.0747 +[2026-01-29T22:20:30.458821Z] Loop 2790: Loss: 2.37e-03, Avg Return: 0.459, Regret: 0.3511, Entropy: 0.0762 +[2026-01-29T22:20:31.619955Z] Loop 2791: Loss: 2.11e-03, Avg Return: 0.443, Regret: 0.3511, Entropy: 0.0753 +[2026-01-29T22:20:32.781470Z] Loop 2792: Loss: 2.59e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0778 +[2026-01-29T22:20:33.942981Z] Loop 2793: Loss: 2.46e-03, Avg Return: 0.462, Regret: 0.3511, Entropy: 0.0735 +[2026-01-29T22:20:35.103711Z] Loop 2794: Loss: 2.43e-03, Avg Return: 0.459, Regret: 0.3511, Entropy: 0.0731 +[2026-01-29T22:20:36.263711Z] Loop 2795: Loss: 2.55e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0782 +[2026-01-29T22:20:37.424918Z] Loop 2796: Loss: 2.72e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0740 +[2026-01-29T22:20:38.584818Z] Loop 2797: Loss: 2.74e-03, Avg Return: 0.445, Regret: 0.3511, Entropy: 0.0809 +[2026-01-29T22:20:39.745670Z] Loop 2798: Loss: 3.39e-03, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.0882 +[2026-01-29T22:20:40.907173Z] Loop 2799: Loss: 3.37e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0923 +[2026-01-29T22:20:42.113200Z] Loop 2800: Loss: 3.57e-03, Avg Return: 0.458, Regret: 0.3527, Entropy: 0.0918 +[2026-01-29T22:20:43.276250Z] Loop 2801: Loss: 3.80e-03, Avg Return: 0.450, Regret: 0.3527, Entropy: 0.0905 +[2026-01-29T22:20:44.437794Z] Loop 2802: Loss: 3.29e-03, Avg Return: 0.452, Regret: 0.3527, Entropy: 0.0824 +[2026-01-29T22:20:45.601113Z] Loop 2803: Loss: 3.08e-03, Avg Return: 0.459, Regret: 0.3527, Entropy: 0.0825 +[2026-01-29T22:20:46.762654Z] Loop 2804: Loss: 2.87e-03, Avg Return: 0.452, Regret: 0.3527, Entropy: 0.0795 +[2026-01-29T22:20:47.924987Z] Loop 2805: Loss: 3.07e-03, Avg Return: 0.455, Regret: 0.3527, Entropy: 0.0786 +[2026-01-29T22:20:49.087938Z] Loop 2806: Loss: 2.68e-03, Avg Return: 0.458, Regret: 0.3527, Entropy: 0.0774 +[2026-01-29T22:20:50.249237Z] Loop 2807: Loss: 2.23e-03, Avg Return: 0.454, Regret: 0.3527, Entropy: 0.0810 +[2026-01-29T22:20:51.412237Z] Loop 2808: Loss: 2.43e-03, Avg Return: 0.454, Regret: 0.3527, Entropy: 0.0736 +[2026-01-29T22:20:52.572412Z] Loop 2809: Loss: 2.06e-03, Avg Return: 0.447, Regret: 0.3527, Entropy: 0.0715 +[2026-01-29T22:20:53.776992Z] Loop 2810: Loss: 1.89e-03, Avg Return: 0.448, Regret: 0.3508, Entropy: 0.0762 +[2026-01-29T22:20:54.936272Z] Loop 2811: Loss: 1.81e-03, Avg Return: 0.449, Regret: 0.3508, Entropy: 0.0735 +[2026-01-29T22:20:56.097278Z] Loop 2812: Loss: 1.79e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0771 +[2026-01-29T22:20:57.257537Z] Loop 2813: Loss: 1.68e-03, Avg Return: 0.443, Regret: 0.3508, Entropy: 0.0822 +[2026-01-29T22:20:58.417876Z] Loop 2814: Loss: 1.90e-03, Avg Return: 0.456, Regret: 0.3508, Entropy: 0.0794 +[2026-01-29T22:20:59.577531Z] Loop 2815: Loss: 2.01e-03, Avg Return: 0.459, Regret: 0.3508, Entropy: 0.0805 +[2026-01-29T22:21:00.738382Z] Loop 2816: Loss: 1.90e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0844 +[2026-01-29T22:21:01.904397Z] Loop 2817: Loss: 2.06e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0836 +[2026-01-29T22:21:03.064908Z] Loop 2818: Loss: 1.71e-03, Avg Return: 0.447, Regret: 0.3508, Entropy: 0.0860 +[2026-01-29T22:21:04.225276Z] Loop 2819: Loss: 1.90e-03, Avg Return: 0.458, Regret: 0.3508, Entropy: 0.0789 +[2026-01-29T22:21:05.433879Z] Loop 2820: Loss: 1.98e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0836 +[2026-01-29T22:21:06.596255Z] Loop 2821: Loss: 1.91e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0813 +[2026-01-29T22:21:07.757728Z] Loop 2822: Loss: 1.93e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0794 +[2026-01-29T22:21:08.919530Z] Loop 2823: Loss: 1.86e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0792 +[2026-01-29T22:21:10.081875Z] Loop 2824: Loss: 2.04e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0808 +[2026-01-29T22:21:11.243628Z] Loop 2825: Loss: 2.24e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0806 +[2026-01-29T22:21:12.406657Z] Loop 2826: Loss: 1.90e-03, Avg Return: 0.443, Regret: 0.3507, Entropy: 0.0800 +[2026-01-29T22:21:13.567924Z] Loop 2827: Loss: 2.09e-03, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0856 +[2026-01-29T22:21:14.729297Z] Loop 2828: Loss: 1.87e-03, Avg Return: 0.444, Regret: 0.3507, Entropy: 0.0906 +[2026-01-29T22:21:15.892260Z] Loop 2829: Loss: 1.89e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0844 +[2026-01-29T22:21:17.100493Z] Loop 2830: Loss: 1.60e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0823 +[2026-01-29T22:21:18.263972Z] Loop 2831: Loss: 1.28e-03, Avg Return: 0.451, Regret: 0.3508, Entropy: 0.0864 +[2026-01-29T22:21:19.424972Z] Loop 2832: Loss: 1.16e-03, Avg Return: 0.452, Regret: 0.3508, Entropy: 0.0924 +[2026-01-29T22:21:20.586900Z] Loop 2833: Loss: 1.28e-03, Avg Return: 0.449, Regret: 0.3508, Entropy: 0.0853 +[2026-01-29T22:21:21.747755Z] Loop 2834: Loss: 1.57e-03, Avg Return: 0.457, Regret: 0.3508, Entropy: 0.0790 +[2026-01-29T22:21:22.911866Z] Loop 2835: Loss: 1.78e-03, Avg Return: 0.445, Regret: 0.3508, Entropy: 0.0826 +[2026-01-29T22:21:24.073908Z] Loop 2836: Loss: 1.74e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0822 +[2026-01-29T22:21:25.233911Z] Loop 2837: Loss: 1.54e-03, Avg Return: 0.451, Regret: 0.3508, Entropy: 0.0862 +[2026-01-29T22:21:26.395347Z] Loop 2838: Loss: 1.37e-03, Avg Return: 0.458, Regret: 0.3508, Entropy: 0.0768 +[2026-01-29T22:21:27.557142Z] Loop 2839: Loss: 1.13e-03, Avg Return: 0.459, Regret: 0.3508, Entropy: 0.0763 +[2026-01-29T22:21:28.768278Z] Loop 2840: Loss: 7.56e-04, Avg Return: 0.450, Regret: 0.3518, Entropy: 0.0711 +[2026-01-29T22:21:29.929671Z] Loop 2841: Loss: 1.02e-03, Avg Return: 0.461, Regret: 0.3518, Entropy: 0.0715 +[2026-01-29T22:21:31.091192Z] Loop 2842: Loss: 1.46e-03, Avg Return: 0.454, Regret: 0.3518, Entropy: 0.0765 +[2026-01-29T22:21:32.252065Z] Loop 2843: Loss: 1.56e-03, Avg Return: 0.447, Regret: 0.3518, Entropy: 0.0864 +[2026-01-29T22:21:33.414976Z] Loop 2844: Loss: 2.05e-03, Avg Return: 0.453, Regret: 0.3518, Entropy: 0.0896 +[2026-01-29T22:21:34.577258Z] Loop 2845: Loss: 2.55e-03, Avg Return: 0.452, Regret: 0.3518, Entropy: 0.0953 +[2026-01-29T22:21:35.738102Z] Loop 2846: Loss: 2.65e-03, Avg Return: 0.441, Regret: 0.3518, Entropy: 0.1019 +[2026-01-29T22:21:36.899859Z] Loop 2847: Loss: 2.97e-03, Avg Return: 0.449, Regret: 0.3518, Entropy: 0.0982 +[2026-01-29T22:21:38.059906Z] Loop 2848: Loss: 3.04e-03, Avg Return: 0.442, Regret: 0.3518, Entropy: 0.1003 +[2026-01-29T22:21:39.220936Z] Loop 2849: Loss: 2.78e-03, Avg Return: 0.449, Regret: 0.3518, Entropy: 0.1026 +[2026-01-29T22:21:40.433731Z] Loop 2850: Loss: 2.94e-03, Avg Return: 0.456, Regret: 0.3538, Entropy: 0.0935 +[2026-01-29T22:21:41.595821Z] Loop 2851: Loss: 2.46e-03, Avg Return: 0.451, Regret: 0.3538, Entropy: 0.0966 +[2026-01-29T22:21:42.758158Z] Loop 2852: Loss: 2.16e-03, Avg Return: 0.452, Regret: 0.3538, Entropy: 0.0921 +[2026-01-29T22:21:43.919411Z] Loop 2853: Loss: 1.94e-03, Avg Return: 0.452, Regret: 0.3538, Entropy: 0.0874 +[2026-01-29T22:21:45.080467Z] Loop 2854: Loss: 1.77e-03, Avg Return: 0.453, Regret: 0.3538, Entropy: 0.0825 +[2026-01-29T22:21:46.240091Z] Loop 2855: Loss: 1.35e-03, Avg Return: 0.449, Regret: 0.3538, Entropy: 0.0767 +[2026-01-29T22:21:47.400409Z] Loop 2856: Loss: 1.06e-03, Avg Return: 0.452, Regret: 0.3538, Entropy: 0.0741 +[2026-01-29T22:21:48.560315Z] Loop 2857: Loss: 1.02e-03, Avg Return: 0.451, Regret: 0.3538, Entropy: 0.0777 +[2026-01-29T22:21:49.721148Z] Loop 2858: Loss: 8.50e-04, Avg Return: 0.453, Regret: 0.3538, Entropy: 0.0806 +[2026-01-29T22:21:50.883675Z] Loop 2859: Loss: 1.17e-03, Avg Return: 0.453, Regret: 0.3538, Entropy: 0.0771 +[2026-01-29T22:21:52.091383Z] Loop 2860: Loss: 1.14e-03, Avg Return: 0.449, Regret: 0.3509, Entropy: 0.0810 +[2026-01-29T22:21:53.253325Z] Loop 2861: Loss: 1.13e-03, Avg Return: 0.452, Regret: 0.3509, Entropy: 0.0871 +[2026-01-29T22:21:54.414055Z] Loop 2862: Loss: 1.48e-03, Avg Return: 0.452, Regret: 0.3509, Entropy: 0.0838 +[2026-01-29T22:21:55.579296Z] Loop 2863: Loss: 1.60e-03, Avg Return: 0.444, Regret: 0.3509, Entropy: 0.0927 +[2026-01-29T22:21:56.739617Z] Loop 2864: Loss: 1.81e-03, Avg Return: 0.454, Regret: 0.3509, Entropy: 0.0949 +[2026-01-29T22:21:57.900229Z] Loop 2865: Loss: 1.70e-03, Avg Return: 0.453, Regret: 0.3509, Entropy: 0.0984 +[2026-01-29T22:21:59.062298Z] Loop 2866: Loss: 1.99e-03, Avg Return: 0.457, Regret: 0.3509, Entropy: 0.0957 +[2026-01-29T22:22:00.224117Z] Loop 2867: Loss: 1.87e-03, Avg Return: 0.450, Regret: 0.3509, Entropy: 0.0896 +[2026-01-29T22:22:01.385927Z] Loop 2868: Loss: 2.00e-03, Avg Return: 0.459, Regret: 0.3509, Entropy: 0.0873 +[2026-01-29T22:22:02.546228Z] Loop 2869: Loss: 1.88e-03, Avg Return: 0.456, Regret: 0.3509, Entropy: 0.0889 +[2026-01-29T22:22:03.755120Z] Loop 2870: Loss: 2.00e-03, Avg Return: 0.444, Regret: 0.3507, Entropy: 0.0896 +[2026-01-29T22:22:04.915640Z] Loop 2871: Loss: 1.72e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0903 +[2026-01-29T22:22:06.075741Z] Loop 2872: Loss: 1.70e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0885 +[2026-01-29T22:22:07.234622Z] Loop 2873: Loss: 1.80e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0859 +[2026-01-29T22:22:08.394300Z] Loop 2874: Loss: 1.67e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0886 +[2026-01-29T22:22:09.554789Z] Loop 2875: Loss: 1.70e-03, Avg Return: 0.443, Regret: 0.3507, Entropy: 0.0924 +[2026-01-29T22:22:10.714697Z] Loop 2876: Loss: 2.03e-03, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0878 +[2026-01-29T22:22:11.875084Z] Loop 2877: Loss: 1.80e-03, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0933 +[2026-01-29T22:22:13.033789Z] Loop 2878: Loss: 1.71e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0894 +[2026-01-29T22:22:14.194434Z] Loop 2879: Loss: 1.59e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0879 +[2026-01-29T22:22:15.399191Z] Loop 2880: Loss: 1.64e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0900 +[2026-01-29T22:22:16.561231Z] Loop 2881: Loss: 1.24e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0880 +[2026-01-29T22:22:17.721644Z] Loop 2882: Loss: 1.08e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0835 +[2026-01-29T22:22:18.883080Z] Loop 2883: Loss: 9.71e-04, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0789 +[2026-01-29T22:22:20.043393Z] Loop 2884: Loss: 9.99e-04, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0798 +[2026-01-29T22:22:21.204641Z] Loop 2885: Loss: 1.32e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0857 +[2026-01-29T22:22:22.366610Z] Loop 2886: Loss: 1.46e-03, Avg Return: 0.447, Regret: 0.3507, Entropy: 0.0867 +[2026-01-29T22:22:23.527265Z] Loop 2887: Loss: 1.62e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0910 +[2026-01-29T22:22:24.688695Z] Loop 2888: Loss: 1.88e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0915 +[2026-01-29T22:22:25.848949Z] Loop 2889: Loss: 1.64e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0953 +[2026-01-29T22:22:27.059100Z] Loop 2890: Loss: 1.73e-03, Avg Return: 0.452, Regret: 0.3514, Entropy: 0.0889 +[2026-01-29T22:22:28.219578Z] Loop 2891: Loss: 1.78e-03, Avg Return: 0.456, Regret: 0.3514, Entropy: 0.0923 +[2026-01-29T22:22:29.381977Z] Loop 2892: Loss: 1.85e-03, Avg Return: 0.455, Regret: 0.3514, Entropy: 0.0919 +[2026-01-29T22:22:30.542692Z] Loop 2893: Loss: 1.61e-03, Avg Return: 0.451, Regret: 0.3514, Entropy: 0.0913 +[2026-01-29T22:22:31.704555Z] Loop 2894: Loss: 2.02e-03, Avg Return: 0.452, Regret: 0.3514, Entropy: 0.0901 +[2026-01-29T22:22:32.867350Z] Loop 2895: Loss: 1.58e-03, Avg Return: 0.458, Regret: 0.3514, Entropy: 0.0870 +[2026-01-29T22:22:34.028385Z] Loop 2896: Loss: 1.49e-03, Avg Return: 0.460, Regret: 0.3514, Entropy: 0.0783 +[2026-01-29T22:22:35.190489Z] Loop 2897: Loss: 1.07e-03, Avg Return: 0.448, Regret: 0.3514, Entropy: 0.0820 +[2026-01-29T22:22:36.351236Z] Loop 2898: Loss: 1.05e-03, Avg Return: 0.448, Regret: 0.3514, Entropy: 0.0777 +[2026-01-29T22:22:37.512669Z] Loop 2899: Loss: 8.55e-04, Avg Return: 0.454, Regret: 0.3514, Entropy: 0.0780 +[2026-01-29T22:22:38.731107Z] Loop 2900: Loss: 8.71e-04, Avg Return: 0.453, Regret: 0.3511, Entropy: 0.0781 +[2026-01-29T22:22:39.891916Z] Loop 2901: Loss: 8.86e-04, Avg Return: 0.453, Regret: 0.3511, Entropy: 0.0762 +[2026-01-29T22:22:41.052788Z] Loop 2902: Loss: 8.46e-04, Avg Return: 0.457, Regret: 0.3511, Entropy: 0.0770 +[2026-01-29T22:22:42.213116Z] Loop 2903: Loss: 9.42e-04, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0764 +[2026-01-29T22:22:43.375176Z] Loop 2904: Loss: 7.92e-04, Avg Return: 0.448, Regret: 0.3511, Entropy: 0.0817 +[2026-01-29T22:22:44.536845Z] Loop 2905: Loss: 9.03e-04, Avg Return: 0.453, Regret: 0.3511, Entropy: 0.0766 +[2026-01-29T22:22:45.698742Z] Loop 2906: Loss: 7.88e-04, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0800 +[2026-01-29T22:22:46.860905Z] Loop 2907: Loss: 7.90e-04, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0788 +[2026-01-29T22:22:48.022171Z] Loop 2908: Loss: 8.99e-04, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0780 +[2026-01-29T22:22:49.183497Z] Loop 2909: Loss: 1.06e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0813 +[2026-01-29T22:22:50.397935Z] Loop 2910: Loss: 1.16e-03, Avg Return: 0.460, Regret: 0.3508, Entropy: 0.0850 +[2026-01-29T22:22:51.559044Z] Loop 2911: Loss: 1.12e-03, Avg Return: 0.452, Regret: 0.3508, Entropy: 0.0824 +[2026-01-29T22:22:52.717948Z] Loop 2912: Loss: 1.20e-03, Avg Return: 0.444, Regret: 0.3508, Entropy: 0.0835 +[2026-01-29T22:22:53.879065Z] Loop 2913: Loss: 1.44e-03, Avg Return: 0.462, Regret: 0.3508, Entropy: 0.0806 +[2026-01-29T22:22:55.040103Z] Loop 2914: Loss: 1.35e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0940 +[2026-01-29T22:22:56.200337Z] Loop 2915: Loss: 1.64e-03, Avg Return: 0.456, Regret: 0.3508, Entropy: 0.0858 +[2026-01-29T22:22:57.361753Z] Loop 2916: Loss: 1.68e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0899 +[2026-01-29T22:22:58.521636Z] Loop 2917: Loss: 1.51e-03, Avg Return: 0.457, Regret: 0.3508, Entropy: 0.0919 +[2026-01-29T22:22:59.687436Z] Loop 2918: Loss: 1.95e-03, Avg Return: 0.461, Regret: 0.3508, Entropy: 0.0893 +[2026-01-29T22:23:00.849896Z] Loop 2919: Loss: 1.70e-03, Avg Return: 0.457, Regret: 0.3508, Entropy: 0.0941 +[2026-01-29T22:23:02.062398Z] Loop 2920: Loss: 2.04e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0934 +[2026-01-29T22:23:03.225015Z] Loop 2921: Loss: 1.84e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0923 +[2026-01-29T22:23:04.389069Z] Loop 2922: Loss: 1.61e-03, Avg Return: 0.443, Regret: 0.3507, Entropy: 0.0916 +[2026-01-29T22:23:05.550762Z] Loop 2923: Loss: 1.70e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0911 +[2026-01-29T22:23:06.710635Z] Loop 2924: Loss: 1.90e-03, Avg Return: 0.446, Regret: 0.3507, Entropy: 0.0845 +[2026-01-29T22:23:07.872184Z] Loop 2925: Loss: 1.72e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0850 +[2026-01-29T22:23:09.031866Z] Loop 2926: Loss: 2.01e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0855 +[2026-01-29T22:23:10.191390Z] Loop 2927: Loss: 2.77e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0858 +[2026-01-29T22:23:11.352619Z] Loop 2928: Loss: 2.76e-03, Avg Return: 0.446, Regret: 0.3507, Entropy: 0.0833 +[2026-01-29T22:23:12.512527Z] Loop 2929: Loss: 2.98e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0816 +[2026-01-29T22:23:13.717140Z] Loop 2930: Loss: 3.44e-03, Avg Return: 0.452, Regret: 0.3523, Entropy: 0.0878 +[2026-01-29T22:23:14.879686Z] Loop 2931: Loss: 3.73e-03, Avg Return: 0.448, Regret: 0.3523, Entropy: 0.0966 +[2026-01-29T22:23:16.041301Z] Loop 2932: Loss: 3.77e-03, Avg Return: 0.443, Regret: 0.3523, Entropy: 0.0956 +[2026-01-29T22:23:17.201822Z] Loop 2933: Loss: 3.39e-03, Avg Return: 0.445, Regret: 0.3523, Entropy: 0.0955 +[2026-01-29T22:23:18.363962Z] Loop 2934: Loss: 3.41e-03, Avg Return: 0.445, Regret: 0.3523, Entropy: 0.0941 +[2026-01-29T22:23:19.527471Z] Loop 2935: Loss: 2.86e-03, Avg Return: 0.451, Regret: 0.3523, Entropy: 0.0881 +[2026-01-29T22:23:20.688301Z] Loop 2936: Loss: 3.15e-03, Avg Return: 0.453, Regret: 0.3523, Entropy: 0.0872 +[2026-01-29T22:23:21.849326Z] Loop 2937: Loss: 2.94e-03, Avg Return: 0.455, Regret: 0.3523, Entropy: 0.0841 +[2026-01-29T22:23:23.010187Z] Loop 2938: Loss: 2.91e-03, Avg Return: 0.451, Regret: 0.3523, Entropy: 0.0833 +[2026-01-29T22:23:24.172868Z] Loop 2939: Loss: 2.45e-03, Avg Return: 0.444, Regret: 0.3523, Entropy: 0.0784 +[2026-01-29T22:23:25.381301Z] Loop 2940: Loss: 2.49e-03, Avg Return: 0.442, Regret: 0.3565, Entropy: 0.0753 +[2026-01-29T22:23:26.542277Z] Loop 2941: Loss: 2.55e-03, Avg Return: 0.451, Regret: 0.3565, Entropy: 0.0747 +[2026-01-29T22:23:27.702574Z] Loop 2942: Loss: 2.58e-03, Avg Return: 0.448, Regret: 0.3565, Entropy: 0.0775 +[2026-01-29T22:23:28.865733Z] Loop 2943: Loss: 2.54e-03, Avg Return: 0.454, Regret: 0.3565, Entropy: 0.0761 +[2026-01-29T22:23:30.028522Z] Loop 2944: Loss: 2.23e-03, Avg Return: 0.448, Regret: 0.3565, Entropy: 0.0707 +[2026-01-29T22:23:31.189132Z] Loop 2945: Loss: 2.55e-03, Avg Return: 0.451, Regret: 0.3565, Entropy: 0.0732 +[2026-01-29T22:23:32.350608Z] Loop 2946: Loss: 2.67e-03, Avg Return: 0.454, Regret: 0.3565, Entropy: 0.0720 +[2026-01-29T22:23:33.510640Z] Loop 2947: Loss: 2.91e-03, Avg Return: 0.447, Regret: 0.3565, Entropy: 0.0763 +[2026-01-29T22:23:34.672364Z] Loop 2948: Loss: 2.78e-03, Avg Return: 0.448, Regret: 0.3565, Entropy: 0.0738 +[2026-01-29T22:23:35.832686Z] Loop 2949: Loss: 2.99e-03, Avg Return: 0.447, Regret: 0.3565, Entropy: 0.0789 +[2026-01-29T22:23:37.038638Z] Loop 2950: Loss: 3.19e-03, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.0802 +[2026-01-29T22:23:38.199421Z] Loop 2951: Loss: 3.30e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0841 +[2026-01-29T22:23:39.361853Z] Loop 2952: Loss: 3.10e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0839 +[2026-01-29T22:23:40.523132Z] Loop 2953: Loss: 2.99e-03, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.0808 +[2026-01-29T22:23:41.684471Z] Loop 2954: Loss: 2.79e-03, Avg Return: 0.453, Regret: 0.3511, Entropy: 0.0718 +[2026-01-29T22:23:42.846822Z] Loop 2955: Loss: 2.28e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0637 +[2026-01-29T22:23:44.007465Z] Loop 2956: Loss: 2.25e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0616 +[2026-01-29T22:23:45.169457Z] Loop 2957: Loss: 2.02e-03, Avg Return: 0.453, Regret: 0.3511, Entropy: 0.0612 +[2026-01-29T22:23:46.329989Z] Loop 2958: Loss: 2.18e-03, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.0603 +[2026-01-29T22:23:47.491111Z] Loop 2959: Loss: 1.73e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0585 +[2026-01-29T22:23:48.696618Z] Loop 2960: Loss: 1.72e-03, Avg Return: 0.450, Regret: 0.3514, Entropy: 0.0575 +[2026-01-29T22:23:49.859273Z] Loop 2961: Loss: 1.67e-03, Avg Return: 0.451, Regret: 0.3514, Entropy: 0.0578 +[2026-01-29T22:23:51.019430Z] Loop 2962: Loss: 1.56e-03, Avg Return: 0.455, Regret: 0.3514, Entropy: 0.0544 +[2026-01-29T22:23:52.180387Z] Loop 2963: Loss: 1.60e-03, Avg Return: 0.456, Regret: 0.3514, Entropy: 0.0571 +[2026-01-29T22:23:53.341815Z] Loop 2964: Loss: 1.64e-03, Avg Return: 0.451, Regret: 0.3514, Entropy: 0.0562 +[2026-01-29T22:23:54.502457Z] Loop 2965: Loss: 1.79e-03, Avg Return: 0.453, Regret: 0.3514, Entropy: 0.0608 +[2026-01-29T22:23:55.666756Z] Loop 2966: Loss: 1.86e-03, Avg Return: 0.451, Regret: 0.3514, Entropy: 0.0609 +[2026-01-29T22:23:56.826912Z] Loop 2967: Loss: 1.96e-03, Avg Return: 0.448, Regret: 0.3514, Entropy: 0.0624 +[2026-01-29T22:23:57.987180Z] Loop 2968: Loss: 2.12e-03, Avg Return: 0.458, Regret: 0.3514, Entropy: 0.0636 +[2026-01-29T22:23:59.149119Z] Loop 2969: Loss: 2.27e-03, Avg Return: 0.447, Regret: 0.3514, Entropy: 0.0619 +[2026-01-29T22:24:00.358896Z] Loop 2970: Loss: 1.78e-03, Avg Return: 0.453, Regret: 0.3512, Entropy: 0.0593 +[2026-01-29T22:24:01.521323Z] Loop 2971: Loss: 1.69e-03, Avg Return: 0.456, Regret: 0.3512, Entropy: 0.0583 +[2026-01-29T22:24:02.682655Z] Loop 2972: Loss: 1.47e-03, Avg Return: 0.442, Regret: 0.3512, Entropy: 0.0588 +[2026-01-29T22:24:03.844074Z] Loop 2973: Loss: 1.45e-03, Avg Return: 0.460, Regret: 0.3512, Entropy: 0.0569 +[2026-01-29T22:24:05.005174Z] Loop 2974: Loss: 1.50e-03, Avg Return: 0.455, Regret: 0.3512, Entropy: 0.0565 +[2026-01-29T22:24:06.168470Z] Loop 2975: Loss: 1.60e-03, Avg Return: 0.454, Regret: 0.3512, Entropy: 0.0524 +[2026-01-29T22:24:07.328816Z] Loop 2976: Loss: 1.42e-03, Avg Return: 0.448, Regret: 0.3512, Entropy: 0.0561 +[2026-01-29T22:24:08.490385Z] Loop 2977: Loss: 1.54e-03, Avg Return: 0.446, Regret: 0.3512, Entropy: 0.0554 +[2026-01-29T22:24:09.652694Z] Loop 2978: Loss: 1.81e-03, Avg Return: 0.454, Regret: 0.3512, Entropy: 0.0591 +[2026-01-29T22:24:10.814188Z] Loop 2979: Loss: 1.78e-03, Avg Return: 0.445, Regret: 0.3512, Entropy: 0.0612 +[2026-01-29T22:24:12.031690Z] Loop 2980: Loss: 2.21e-03, Avg Return: 0.458, Regret: 0.3511, Entropy: 0.0622 +[2026-01-29T22:24:13.200141Z] Loop 2981: Loss: 2.10e-03, Avg Return: 0.457, Regret: 0.3511, Entropy: 0.0632 +[2026-01-29T22:24:14.360633Z] Loop 2982: Loss: 2.40e-03, Avg Return: 0.448, Regret: 0.3511, Entropy: 0.0663 +[2026-01-29T22:24:15.522028Z] Loop 2983: Loss: 2.46e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0705 +[2026-01-29T22:24:16.682585Z] Loop 2984: Loss: 2.48e-03, Avg Return: 0.457, Regret: 0.3511, Entropy: 0.0718 +[2026-01-29T22:24:17.843643Z] Loop 2985: Loss: 2.52e-03, Avg Return: 0.445, Regret: 0.3511, Entropy: 0.0772 +[2026-01-29T22:24:19.003640Z] Loop 2986: Loss: 2.64e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0780 +[2026-01-29T22:24:20.163829Z] Loop 2987: Loss: 2.60e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0830 +[2026-01-29T22:24:21.323073Z] Loop 2988: Loss: 2.61e-03, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.0777 +[2026-01-29T22:24:22.482643Z] Loop 2989: Loss: 2.86e-03, Avg Return: 0.461, Regret: 0.3511, Entropy: 0.0796 +[2026-01-29T22:24:23.688147Z] Loop 2990: Loss: 2.72e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0837 +[2026-01-29T22:24:24.852323Z] Loop 2991: Loss: 2.66e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0827 +[2026-01-29T22:24:26.013807Z] Loop 2992: Loss: 2.11e-03, Avg Return: 0.453, Regret: 0.3511, Entropy: 0.0802 +[2026-01-29T22:24:27.174477Z] Loop 2993: Loss: 1.63e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0805 +[2026-01-29T22:24:28.335787Z] Loop 2994: Loss: 1.60e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0768 +[2026-01-29T22:24:29.495423Z] Loop 2995: Loss: 1.61e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0794 +[2026-01-29T22:24:30.656354Z] Loop 2996: Loss: 1.07e-03, Avg Return: 0.446, Regret: 0.3511, Entropy: 0.0816 +[2026-01-29T22:24:31.817129Z] Loop 2997: Loss: 1.36e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0802 +[2026-01-29T22:24:32.977458Z] Loop 2998: Loss: 1.58e-03, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.0812 +[2026-01-29T22:24:34.137246Z] Loop 2999: Loss: 1.68e-03, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0823 +[2026-01-29T22:24:35.339788Z] Loop 3000: Loss: 1.33e-03, Avg Return: 0.447, Regret: 0.3530, Entropy: 0.0845 +[2026-01-29T22:24:36.500700Z] Loop 3001: Loss: 1.31e-03, Avg Return: 0.450, Regret: 0.3530, Entropy: 0.0849 +[2026-01-29T22:24:37.660954Z] Loop 3002: Loss: 1.16e-03, Avg Return: 0.443, Regret: 0.3530, Entropy: 0.0855 +[2026-01-29T22:24:38.820528Z] Loop 3003: Loss: 1.20e-03, Avg Return: 0.453, Regret: 0.3530, Entropy: 0.0817 +[2026-01-29T22:24:39.981692Z] Loop 3004: Loss: 1.04e-03, Avg Return: 0.449, Regret: 0.3530, Entropy: 0.0792 +[2026-01-29T22:24:41.143083Z] Loop 3005: Loss: 9.12e-04, Avg Return: 0.458, Regret: 0.3530, Entropy: 0.0762 +[2026-01-29T22:24:42.303727Z] Loop 3006: Loss: 7.88e-04, Avg Return: 0.444, Regret: 0.3530, Entropy: 0.0690 +[2026-01-29T22:24:43.464990Z] Loop 3007: Loss: 6.48e-04, Avg Return: 0.457, Regret: 0.3530, Entropy: 0.0730 +[2026-01-29T22:24:44.625371Z] Loop 3008: Loss: 7.68e-04, Avg Return: 0.455, Regret: 0.3530, Entropy: 0.0684 +[2026-01-29T22:24:45.785800Z] Loop 3009: Loss: 9.40e-04, Avg Return: 0.455, Regret: 0.3530, Entropy: 0.0655 +[2026-01-29T22:24:46.997412Z] Loop 3010: Loss: 1.10e-03, Avg Return: 0.451, Regret: 0.3530, Entropy: 0.0762 +[2026-01-29T22:24:48.165312Z] Loop 3011: Loss: 1.21e-03, Avg Return: 0.455, Regret: 0.3530, Entropy: 0.0728 +[2026-01-29T22:24:49.327446Z] Loop 3012: Loss: 1.37e-03, Avg Return: 0.451, Regret: 0.3530, Entropy: 0.0744 +[2026-01-29T22:24:50.490404Z] Loop 3013: Loss: 1.29e-03, Avg Return: 0.441, Regret: 0.3530, Entropy: 0.0759 +[2026-01-29T22:24:51.652421Z] Loop 3014: Loss: 1.47e-03, Avg Return: 0.457, Regret: 0.3530, Entropy: 0.0698 +[2026-01-29T22:24:52.815715Z] Loop 3015: Loss: 1.51e-03, Avg Return: 0.452, Regret: 0.3530, Entropy: 0.0695 +[2026-01-29T22:24:53.977487Z] Loop 3016: Loss: 1.36e-03, Avg Return: 0.456, Regret: 0.3530, Entropy: 0.0739 +[2026-01-29T22:24:55.140086Z] Loop 3017: Loss: 1.30e-03, Avg Return: 0.459, Regret: 0.3530, Entropy: 0.0685 +[2026-01-29T22:24:56.305031Z] Loop 3018: Loss: 1.28e-03, Avg Return: 0.448, Regret: 0.3530, Entropy: 0.0708 +[2026-01-29T22:24:57.467106Z] Loop 3019: Loss: 1.49e-03, Avg Return: 0.453, Regret: 0.3530, Entropy: 0.0704 +[2026-01-29T22:24:58.681001Z] Loop 3020: Loss: 1.43e-03, Avg Return: 0.449, Regret: 0.3520, Entropy: 0.0707 +[2026-01-29T22:24:59.842295Z] Loop 3021: Loss: 1.44e-03, Avg Return: 0.454, Regret: 0.3520, Entropy: 0.0703 +[2026-01-29T22:25:01.004161Z] Loop 3022: Loss: 1.31e-03, Avg Return: 0.453, Regret: 0.3520, Entropy: 0.0722 +[2026-01-29T22:25:02.165251Z] Loop 3023: Loss: 1.26e-03, Avg Return: 0.462, Regret: 0.3520, Entropy: 0.0730 +[2026-01-29T22:25:03.327317Z] Loop 3024: Loss: 1.03e-03, Avg Return: 0.453, Regret: 0.3520, Entropy: 0.0740 +[2026-01-29T22:25:04.487476Z] Loop 3025: Loss: 1.19e-03, Avg Return: 0.462, Regret: 0.3520, Entropy: 0.0734 +[2026-01-29T22:25:05.648007Z] Loop 3026: Loss: 1.07e-03, Avg Return: 0.458, Regret: 0.3520, Entropy: 0.0790 +[2026-01-29T22:25:06.809658Z] Loop 3027: Loss: 9.32e-04, Avg Return: 0.457, Regret: 0.3520, Entropy: 0.0769 +[2026-01-29T22:25:07.969904Z] Loop 3028: Loss: 1.08e-03, Avg Return: 0.451, Regret: 0.3520, Entropy: 0.0761 +[2026-01-29T22:25:09.132608Z] Loop 3029: Loss: 1.06e-03, Avg Return: 0.451, Regret: 0.3520, Entropy: 0.0814 +[2026-01-29T22:25:10.337961Z] Loop 3030: Loss: 1.00e-03, Avg Return: 0.460, Regret: 0.3507, Entropy: 0.0749 +[2026-01-29T22:25:11.499712Z] Loop 3031: Loss: 9.76e-04, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0752 +[2026-01-29T22:25:12.660228Z] Loop 3032: Loss: 1.04e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0790 +[2026-01-29T22:25:13.821369Z] Loop 3033: Loss: 1.12e-03, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0753 +[2026-01-29T22:25:14.980914Z] Loop 3034: Loss: 1.22e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0815 +[2026-01-29T22:25:16.141933Z] Loop 3035: Loss: 1.07e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0784 +[2026-01-29T22:25:17.302716Z] Loop 3036: Loss: 1.28e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0801 +[2026-01-29T22:25:18.462830Z] Loop 3037: Loss: 1.28e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0881 +[2026-01-29T22:25:19.623984Z] Loop 3038: Loss: 1.41e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0924 +[2026-01-29T22:25:20.784651Z] Loop 3039: Loss: 1.63e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0852 +[2026-01-29T22:25:21.990181Z] Loop 3040: Loss: 1.60e-03, Avg Return: 0.447, Regret: 0.3507, Entropy: 0.0876 +[2026-01-29T22:25:23.151128Z] Loop 3041: Loss: 1.62e-03, Avg Return: 0.464, Regret: 0.3507, Entropy: 0.0897 +[2026-01-29T22:25:24.312781Z] Loop 3042: Loss: 1.54e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0914 +[2026-01-29T22:25:25.476228Z] Loop 3043: Loss: 1.77e-03, Avg Return: 0.446, Regret: 0.3507, Entropy: 0.0983 +[2026-01-29T22:25:26.637917Z] Loop 3044: Loss: 1.76e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0955 +[2026-01-29T22:25:27.798639Z] Loop 3045: Loss: 1.64e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0880 +[2026-01-29T22:25:28.959292Z] Loop 3046: Loss: 2.04e-03, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0944 +[2026-01-29T22:25:30.121785Z] Loop 3047: Loss: 1.80e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0968 +[2026-01-29T22:25:31.282832Z] Loop 3048: Loss: 1.98e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0980 +[2026-01-29T22:25:32.444160Z] Loop 3049: Loss: 2.00e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0979 +[2026-01-29T22:25:33.653707Z] Loop 3050: Loss: 1.98e-03, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0948 +[2026-01-29T22:25:34.816006Z] Loop 3051: Loss: 2.22e-03, Avg Return: 0.462, Regret: 0.3507, Entropy: 0.0912 +[2026-01-29T22:25:35.976935Z] Loop 3052: Loss: 2.00e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0904 +[2026-01-29T22:25:37.137821Z] Loop 3053: Loss: 1.73e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0907 +[2026-01-29T22:25:38.298840Z] Loop 3054: Loss: 1.57e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0888 +[2026-01-29T22:25:39.458775Z] Loop 3055: Loss: 1.49e-03, Avg Return: 0.446, Regret: 0.3507, Entropy: 0.0910 +[2026-01-29T22:25:40.620409Z] Loop 3056: Loss: 1.27e-03, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0887 +[2026-01-29T22:25:41.780559Z] Loop 3057: Loss: 1.45e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0779 +[2026-01-29T22:25:42.941275Z] Loop 3058: Loss: 1.30e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0786 +[2026-01-29T22:25:44.101268Z] Loop 3059: Loss: 1.18e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0832 +[2026-01-29T22:25:45.308612Z] Loop 3060: Loss: 1.34e-03, Avg Return: 0.459, Regret: 0.3506, Entropy: 0.0903 +[2026-01-29T22:25:46.470944Z] Loop 3061: Loss: 1.35e-03, Avg Return: 0.457, Regret: 0.3506, Entropy: 0.0844 +[2026-01-29T22:25:47.632679Z] Loop 3062: Loss: 1.44e-03, Avg Return: 0.454, Regret: 0.3506, Entropy: 0.0837 +[2026-01-29T22:25:48.795000Z] Loop 3063: Loss: 1.43e-03, Avg Return: 0.454, Regret: 0.3506, Entropy: 0.0847 +[2026-01-29T22:25:49.956751Z] Loop 3064: Loss: 1.69e-03, Avg Return: 0.464, Regret: 0.3506, Entropy: 0.0810 +[2026-01-29T22:25:51.119032Z] Loop 3065: Loss: 1.44e-03, Avg Return: 0.461, Regret: 0.3506, Entropy: 0.0837 +[2026-01-29T22:25:52.280299Z] Loop 3066: Loss: 1.49e-03, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0859 +[2026-01-29T22:25:53.441777Z] Loop 3067: Loss: 1.36e-03, Avg Return: 0.452, Regret: 0.3506, Entropy: 0.0871 +[2026-01-29T22:25:54.603275Z] Loop 3068: Loss: 1.37e-03, Avg Return: 0.454, Regret: 0.3506, Entropy: 0.0908 +[2026-01-29T22:25:55.764201Z] Loop 3069: Loss: 1.36e-03, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0872 +[2026-01-29T22:25:56.971410Z] Loop 3070: Loss: 1.28e-03, Avg Return: 0.458, Regret: 0.3506, Entropy: 0.0870 +[2026-01-29T22:25:58.132215Z] Loop 3071: Loss: 1.17e-03, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0772 +[2026-01-29T22:25:59.294214Z] Loop 3072: Loss: 1.18e-03, Avg Return: 0.450, Regret: 0.3506, Entropy: 0.0838 +[2026-01-29T22:26:00.455344Z] Loop 3073: Loss: 9.49e-04, Avg Return: 0.447, Regret: 0.3506, Entropy: 0.0770 +[2026-01-29T22:26:01.617622Z] Loop 3074: Loss: 9.97e-04, Avg Return: 0.456, Regret: 0.3506, Entropy: 0.0736 +[2026-01-29T22:26:02.777982Z] Loop 3075: Loss: 9.07e-04, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0725 +[2026-01-29T22:26:03.939816Z] Loop 3076: Loss: 9.14e-04, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0768 +[2026-01-29T22:26:05.101317Z] Loop 3077: Loss: 1.01e-03, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0719 +[2026-01-29T22:26:06.261920Z] Loop 3078: Loss: 1.04e-03, Avg Return: 0.458, Regret: 0.3506, Entropy: 0.0755 +[2026-01-29T22:26:07.424220Z] Loop 3079: Loss: 1.13e-03, Avg Return: 0.446, Regret: 0.3506, Entropy: 0.0730 +[2026-01-29T22:26:08.632281Z] Loop 3080: Loss: 1.08e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.0723 +[2026-01-29T22:26:09.793987Z] Loop 3081: Loss: 1.19e-03, Avg Return: 0.455, Regret: 0.3513, Entropy: 0.0736 +[2026-01-29T22:26:10.953971Z] Loop 3082: Loss: 1.49e-03, Avg Return: 0.442, Regret: 0.3513, Entropy: 0.0747 +[2026-01-29T22:26:12.115002Z] Loop 3083: Loss: 1.85e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.0754 +[2026-01-29T22:26:13.275223Z] Loop 3084: Loss: 2.08e-03, Avg Return: 0.452, Regret: 0.3513, Entropy: 0.0812 +[2026-01-29T22:26:14.435373Z] Loop 3085: Loss: 2.53e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.0907 +[2026-01-29T22:26:15.596749Z] Loop 3086: Loss: 2.34e-03, Avg Return: 0.448, Regret: 0.3513, Entropy: 0.0865 +[2026-01-29T22:26:16.757110Z] Loop 3087: Loss: 2.47e-03, Avg Return: 0.452, Regret: 0.3513, Entropy: 0.0839 +[2026-01-29T22:26:17.918381Z] Loop 3088: Loss: 2.17e-03, Avg Return: 0.448, Regret: 0.3513, Entropy: 0.0845 +[2026-01-29T22:26:19.077790Z] Loop 3089: Loss: 2.21e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.0802 +[2026-01-29T22:26:20.283701Z] Loop 3090: Loss: 1.87e-03, Avg Return: 0.443, Regret: 0.3548, Entropy: 0.0783 +[2026-01-29T22:26:21.445119Z] Loop 3091: Loss: 2.33e-03, Avg Return: 0.456, Regret: 0.3548, Entropy: 0.0782 +[2026-01-29T22:26:22.607499Z] Loop 3092: Loss: 2.40e-03, Avg Return: 0.454, Regret: 0.3548, Entropy: 0.0856 +[2026-01-29T22:26:23.768634Z] Loop 3093: Loss: 2.32e-03, Avg Return: 0.450, Regret: 0.3548, Entropy: 0.0876 +[2026-01-29T22:26:24.929697Z] Loop 3094: Loss: 2.32e-03, Avg Return: 0.451, Regret: 0.3548, Entropy: 0.0872 +[2026-01-29T22:26:26.089591Z] Loop 3095: Loss: 2.71e-03, Avg Return: 0.457, Regret: 0.3548, Entropy: 0.0904 +[2026-01-29T22:26:27.250172Z] Loop 3096: Loss: 2.42e-03, Avg Return: 0.449, Regret: 0.3548, Entropy: 0.0942 +[2026-01-29T22:26:28.411860Z] Loop 3097: Loss: 2.43e-03, Avg Return: 0.448, Regret: 0.3548, Entropy: 0.0913 +[2026-01-29T22:26:29.572210Z] Loop 3098: Loss: 2.58e-03, Avg Return: 0.455, Regret: 0.3548, Entropy: 0.0910 +[2026-01-29T22:26:30.733239Z] Loop 3099: Loss: 2.47e-03, Avg Return: 0.455, Regret: 0.3548, Entropy: 0.0904 +[2026-01-29T22:26:31.938370Z] Loop 3100: Loss: 2.37e-03, Avg Return: 0.452, Regret: 0.3517, Entropy: 0.0942 +[2026-01-29T22:26:33.101267Z] Loop 3101: Loss: 2.41e-03, Avg Return: 0.447, Regret: 0.3517, Entropy: 0.0988 +[2026-01-29T22:26:34.264343Z] Loop 3102: Loss: 2.54e-03, Avg Return: 0.450, Regret: 0.3517, Entropy: 0.0895 +[2026-01-29T22:26:35.425921Z] Loop 3103: Loss: 2.65e-03, Avg Return: 0.451, Regret: 0.3517, Entropy: 0.0963 +[2026-01-29T22:26:36.586165Z] Loop 3104: Loss: 2.54e-03, Avg Return: 0.453, Regret: 0.3517, Entropy: 0.0981 +[2026-01-29T22:26:37.748432Z] Loop 3105: Loss: 2.33e-03, Avg Return: 0.457, Regret: 0.3517, Entropy: 0.0883 +[2026-01-29T22:26:38.911291Z] Loop 3106: Loss: 1.56e-03, Avg Return: 0.439, Regret: 0.3517, Entropy: 0.0735 +[2026-01-29T22:26:40.071336Z] Loop 3107: Loss: 1.21e-03, Avg Return: 0.452, Regret: 0.3517, Entropy: 0.0736 +[2026-01-29T22:26:41.232746Z] Loop 3108: Loss: 9.27e-04, Avg Return: 0.446, Regret: 0.3517, Entropy: 0.0652 +[2026-01-29T22:26:42.392940Z] Loop 3109: Loss: 8.16e-04, Avg Return: 0.451, Regret: 0.3517, Entropy: 0.0674 +[2026-01-29T22:26:43.604688Z] Loop 3110: Loss: 9.55e-04, Avg Return: 0.450, Regret: 0.3554, Entropy: 0.0617 +[2026-01-29T22:26:44.766971Z] Loop 3111: Loss: 1.04e-03, Avg Return: 0.455, Regret: 0.3554, Entropy: 0.0638 +[2026-01-29T22:26:45.927987Z] Loop 3112: Loss: 1.01e-03, Avg Return: 0.441, Regret: 0.3554, Entropy: 0.0675 +[2026-01-29T22:26:47.089854Z] Loop 3113: Loss: 1.10e-03, Avg Return: 0.452, Regret: 0.3554, Entropy: 0.0674 +[2026-01-29T22:26:48.251462Z] Loop 3114: Loss: 1.16e-03, Avg Return: 0.444, Regret: 0.3554, Entropy: 0.0699 +[2026-01-29T22:26:49.413863Z] Loop 3115: Loss: 1.11e-03, Avg Return: 0.441, Regret: 0.3554, Entropy: 0.0699 +[2026-01-29T22:26:50.574261Z] Loop 3116: Loss: 9.91e-04, Avg Return: 0.451, Regret: 0.3554, Entropy: 0.0688 +[2026-01-29T22:26:51.735117Z] Loop 3117: Loss: 9.03e-04, Avg Return: 0.451, Regret: 0.3554, Entropy: 0.0655 +[2026-01-29T22:26:52.901362Z] Loop 3118: Loss: 1.00e-03, Avg Return: 0.447, Regret: 0.3554, Entropy: 0.0640 +[2026-01-29T22:26:54.061911Z] Loop 3119: Loss: 1.02e-03, Avg Return: 0.445, Regret: 0.3554, Entropy: 0.0684 +[2026-01-29T22:26:55.274515Z] Loop 3120: Loss: 1.17e-03, Avg Return: 0.451, Regret: 0.3526, Entropy: 0.0703 +[2026-01-29T22:26:56.436610Z] Loop 3121: Loss: 1.72e-03, Avg Return: 0.450, Regret: 0.3526, Entropy: 0.0756 +[2026-01-29T22:26:57.597667Z] Loop 3122: Loss: 2.18e-03, Avg Return: 0.447, Regret: 0.3526, Entropy: 0.0996 +[2026-01-29T22:26:58.757128Z] Loop 3123: Loss: 2.48e-03, Avg Return: 0.450, Regret: 0.3526, Entropy: 0.1062 +[2026-01-29T22:26:59.918313Z] Loop 3124: Loss: 2.91e-03, Avg Return: 0.449, Regret: 0.3526, Entropy: 0.1111 +[2026-01-29T22:27:01.079218Z] Loop 3125: Loss: 2.71e-03, Avg Return: 0.451, Regret: 0.3526, Entropy: 0.1034 +[2026-01-29T22:27:02.239371Z] Loop 3126: Loss: 2.76e-03, Avg Return: 0.451, Regret: 0.3526, Entropy: 0.1047 +[2026-01-29T22:27:03.400492Z] Loop 3127: Loss: 2.48e-03, Avg Return: 0.450, Regret: 0.3526, Entropy: 0.0985 +[2026-01-29T22:27:04.561537Z] Loop 3128: Loss: 2.09e-03, Avg Return: 0.455, Regret: 0.3526, Entropy: 0.0995 +[2026-01-29T22:27:05.725669Z] Loop 3129: Loss: 1.92e-03, Avg Return: 0.452, Regret: 0.3526, Entropy: 0.0913 +[2026-01-29T22:27:06.931714Z] Loop 3130: Loss: 1.53e-03, Avg Return: 0.459, Regret: 0.3508, Entropy: 0.0834 +[2026-01-29T22:27:08.093101Z] Loop 3131: Loss: 1.43e-03, Avg Return: 0.458, Regret: 0.3508, Entropy: 0.0863 +[2026-01-29T22:27:09.254267Z] Loop 3132: Loss: 1.03e-03, Avg Return: 0.454, Regret: 0.3508, Entropy: 0.0825 +[2026-01-29T22:27:10.417268Z] Loop 3133: Loss: 7.24e-04, Avg Return: 0.454, Regret: 0.3508, Entropy: 0.0816 +[2026-01-29T22:27:11.578869Z] Loop 3134: Loss: 7.27e-04, Avg Return: 0.456, Regret: 0.3508, Entropy: 0.0771 +[2026-01-29T22:27:12.739400Z] Loop 3135: Loss: 1.00e-03, Avg Return: 0.451, Regret: 0.3508, Entropy: 0.0731 +[2026-01-29T22:27:13.900845Z] Loop 3136: Loss: 1.15e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0727 +[2026-01-29T22:27:15.061890Z] Loop 3137: Loss: 1.41e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0815 +[2026-01-29T22:27:16.224478Z] Loop 3138: Loss: 1.66e-03, Avg Return: 0.458, Regret: 0.3508, Entropy: 0.0827 +[2026-01-29T22:27:17.385988Z] Loop 3139: Loss: 1.29e-03, Avg Return: 0.458, Regret: 0.3508, Entropy: 0.0722 +[2026-01-29T22:27:18.594930Z] Loop 3140: Loss: 1.30e-03, Avg Return: 0.446, Regret: 0.3508, Entropy: 0.0759 +[2026-01-29T22:27:19.757517Z] Loop 3141: Loss: 1.57e-03, Avg Return: 0.451, Regret: 0.3508, Entropy: 0.0709 +[2026-01-29T22:27:20.919244Z] Loop 3142: Loss: 1.68e-03, Avg Return: 0.457, Regret: 0.3508, Entropy: 0.0700 +[2026-01-29T22:27:22.081264Z] Loop 3143: Loss: 2.02e-03, Avg Return: 0.457, Regret: 0.3508, Entropy: 0.0749 +[2026-01-29T22:27:23.242423Z] Loop 3144: Loss: 1.78e-03, Avg Return: 0.451, Regret: 0.3508, Entropy: 0.0769 +[2026-01-29T22:27:24.404497Z] Loop 3145: Loss: 1.74e-03, Avg Return: 0.456, Regret: 0.3508, Entropy: 0.0717 +[2026-01-29T22:27:25.565427Z] Loop 3146: Loss: 1.73e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0755 +[2026-01-29T22:27:26.726207Z] Loop 3147: Loss: 1.67e-03, Avg Return: 0.448, Regret: 0.3508, Entropy: 0.0678 +[2026-01-29T22:27:27.888058Z] Loop 3148: Loss: 1.45e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0673 +[2026-01-29T22:27:29.048376Z] Loop 3149: Loss: 1.17e-03, Avg Return: 0.458, Regret: 0.3508, Entropy: 0.0728 +[2026-01-29T22:27:30.255406Z] Loop 3150: Loss: 1.12e-03, Avg Return: 0.451, Regret: 0.3508, Entropy: 0.0705 +[2026-01-29T22:27:31.416668Z] Loop 3151: Loss: 1.01e-03, Avg Return: 0.454, Regret: 0.3508, Entropy: 0.0703 +[2026-01-29T22:27:32.578934Z] Loop 3152: Loss: 1.07e-03, Avg Return: 0.448, Regret: 0.3508, Entropy: 0.0676 +[2026-01-29T22:27:33.740626Z] Loop 3153: Loss: 1.12e-03, Avg Return: 0.448, Regret: 0.3508, Entropy: 0.0679 +[2026-01-29T22:27:34.902979Z] Loop 3154: Loss: 1.11e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0656 +[2026-01-29T22:27:36.063678Z] Loop 3155: Loss: 9.31e-04, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0671 +[2026-01-29T22:27:37.225316Z] Loop 3156: Loss: 1.36e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0696 +[2026-01-29T22:27:38.387275Z] Loop 3157: Loss: 1.02e-03, Avg Return: 0.450, Regret: 0.3508, Entropy: 0.0753 +[2026-01-29T22:27:39.548050Z] Loop 3158: Loss: 1.01e-03, Avg Return: 0.452, Regret: 0.3508, Entropy: 0.0653 +[2026-01-29T22:27:40.710745Z] Loop 3159: Loss: 1.15e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0706 +[2026-01-29T22:27:41.922303Z] Loop 3160: Loss: 1.21e-03, Avg Return: 0.446, Regret: 0.3507, Entropy: 0.0658 +[2026-01-29T22:27:43.083962Z] Loop 3161: Loss: 1.10e-03, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0712 +[2026-01-29T22:27:44.244672Z] Loop 3162: Loss: 1.11e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0662 +[2026-01-29T22:27:45.406508Z] Loop 3163: Loss: 1.28e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0713 +[2026-01-29T22:27:46.568900Z] Loop 3164: Loss: 1.23e-03, Avg Return: 0.462, Regret: 0.3507, Entropy: 0.0686 +[2026-01-29T22:27:47.730475Z] Loop 3165: Loss: 1.11e-03, Avg Return: 0.444, Regret: 0.3507, Entropy: 0.0676 +[2026-01-29T22:27:48.892299Z] Loop 3166: Loss: 1.20e-03, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0658 +[2026-01-29T22:27:50.052496Z] Loop 3167: Loss: 1.24e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0709 +[2026-01-29T22:27:51.214320Z] Loop 3168: Loss: 1.25e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0679 +[2026-01-29T22:27:52.378220Z] Loop 3169: Loss: 1.08e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0733 +[2026-01-29T22:27:53.586171Z] Loop 3170: Loss: 1.09e-03, Avg Return: 0.447, Regret: 0.3507, Entropy: 0.0680 +[2026-01-29T22:27:54.747655Z] Loop 3171: Loss: 1.05e-03, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0690 +[2026-01-29T22:27:55.908557Z] Loop 3172: Loss: 1.10e-03, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0649 +[2026-01-29T22:27:57.071549Z] Loop 3173: Loss: 1.35e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0669 +[2026-01-29T22:27:58.232621Z] Loop 3174: Loss: 1.12e-03, Avg Return: 0.459, Regret: 0.3507, Entropy: 0.0672 +[2026-01-29T22:27:59.393506Z] Loop 3175: Loss: 1.02e-03, Avg Return: 0.447, Regret: 0.3507, Entropy: 0.0660 +[2026-01-29T22:28:00.553395Z] Loop 3176: Loss: 1.10e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0722 +[2026-01-29T22:28:01.714222Z] Loop 3177: Loss: 1.07e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0686 +[2026-01-29T22:28:02.876556Z] Loop 3178: Loss: 1.21e-03, Avg Return: 0.460, Regret: 0.3507, Entropy: 0.0684 +[2026-01-29T22:28:04.037072Z] Loop 3179: Loss: 1.35e-03, Avg Return: 0.461, Regret: 0.3507, Entropy: 0.0710 +[2026-01-29T22:28:05.247078Z] Loop 3180: Loss: 1.39e-03, Avg Return: 0.460, Regret: 0.3507, Entropy: 0.0697 +[2026-01-29T22:28:06.409340Z] Loop 3181: Loss: 1.25e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0692 +[2026-01-29T22:28:07.571585Z] Loop 3182: Loss: 1.07e-03, Avg Return: 0.442, Regret: 0.3507, Entropy: 0.0686 +[2026-01-29T22:28:08.732566Z] Loop 3183: Loss: 9.84e-04, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0669 +[2026-01-29T22:28:09.894444Z] Loop 3184: Loss: 9.73e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0682 +[2026-01-29T22:28:11.054995Z] Loop 3185: Loss: 8.33e-04, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0713 +[2026-01-29T22:28:12.216224Z] Loop 3186: Loss: 8.59e-04, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0697 +[2026-01-29T22:28:13.379058Z] Loop 3187: Loss: 7.29e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0714 +[2026-01-29T22:28:14.540182Z] Loop 3188: Loss: 8.54e-04, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0735 +[2026-01-29T22:28:15.701689Z] Loop 3189: Loss: 8.11e-04, Avg Return: 0.447, Regret: 0.3507, Entropy: 0.0739 +[2026-01-29T22:28:16.910326Z] Loop 3190: Loss: 9.60e-04, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.0764 +[2026-01-29T22:28:18.072319Z] Loop 3191: Loss: 1.10e-03, Avg Return: 0.467, Regret: 0.3511, Entropy: 0.0704 +[2026-01-29T22:28:19.234103Z] Loop 3192: Loss: 9.88e-04, Avg Return: 0.443, Regret: 0.3511, Entropy: 0.0769 +[2026-01-29T22:28:20.394803Z] Loop 3193: Loss: 1.07e-03, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.0751 +[2026-01-29T22:28:21.556890Z] Loop 3194: Loss: 9.59e-04, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0738 +[2026-01-29T22:28:22.717833Z] Loop 3195: Loss: 1.09e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0754 +[2026-01-29T22:28:23.882576Z] Loop 3196: Loss: 1.14e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0803 +[2026-01-29T22:28:25.043578Z] Loop 3197: Loss: 1.18e-03, Avg Return: 0.441, Regret: 0.3511, Entropy: 0.0874 +[2026-01-29T22:28:26.204274Z] Loop 3198: Loss: 1.25e-03, Avg Return: 0.458, Regret: 0.3511, Entropy: 0.0766 +[2026-01-29T22:28:27.366433Z] Loop 3199: Loss: 1.72e-03, Avg Return: 0.458, Regret: 0.3511, Entropy: 0.0869 +[2026-01-29T22:28:28.577295Z] Loop 3200: Loss: 2.05e-03, Avg Return: 0.454, Regret: 0.3508, Entropy: 0.0833 +[2026-01-29T22:28:29.740347Z] Loop 3201: Loss: 2.05e-03, Avg Return: 0.449, Regret: 0.3508, Entropy: 0.0946 +[2026-01-29T22:28:30.901553Z] Loop 3202: Loss: 2.37e-03, Avg Return: 0.459, Regret: 0.3508, Entropy: 0.1001 +[2026-01-29T22:28:32.063192Z] Loop 3203: Loss: 2.22e-03, Avg Return: 0.460, Regret: 0.3508, Entropy: 0.0894 +[2026-01-29T22:28:33.223416Z] Loop 3204: Loss: 1.83e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0874 +[2026-01-29T22:28:34.386228Z] Loop 3205: Loss: 1.43e-03, Avg Return: 0.456, Regret: 0.3508, Entropy: 0.0781 +[2026-01-29T22:28:35.547185Z] Loop 3206: Loss: 1.05e-03, Avg Return: 0.452, Regret: 0.3508, Entropy: 0.0750 +[2026-01-29T22:28:36.708585Z] Loop 3207: Loss: 9.23e-04, Avg Return: 0.459, Regret: 0.3508, Entropy: 0.0712 +[2026-01-29T22:28:37.870675Z] Loop 3208: Loss: 9.00e-04, Avg Return: 0.444, Regret: 0.3508, Entropy: 0.0737 +[2026-01-29T22:28:39.030710Z] Loop 3209: Loss: 1.04e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0735 +[2026-01-29T22:28:40.240507Z] Loop 3210: Loss: 1.14e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0688 +[2026-01-29T22:28:41.401948Z] Loop 3211: Loss: 1.16e-03, Avg Return: 0.440, Regret: 0.3507, Entropy: 0.0728 +[2026-01-29T22:28:42.563347Z] Loop 3212: Loss: 1.51e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0690 +[2026-01-29T22:28:43.724097Z] Loop 3213: Loss: 1.42e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0724 +[2026-01-29T22:28:44.885653Z] Loop 3214: Loss: 1.29e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0770 +[2026-01-29T22:28:46.047489Z] Loop 3215: Loss: 1.18e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0728 +[2026-01-29T22:28:47.208722Z] Loop 3216: Loss: 1.30e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0714 +[2026-01-29T22:28:48.370654Z] Loop 3217: Loss: 1.12e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0705 +[2026-01-29T22:28:49.530877Z] Loop 3218: Loss: 1.09e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0722 +[2026-01-29T22:28:50.697131Z] Loop 3219: Loss: 9.01e-04, Avg Return: 0.444, Regret: 0.3507, Entropy: 0.0693 +[2026-01-29T22:28:51.907539Z] Loop 3220: Loss: 7.82e-04, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0698 +[2026-01-29T22:28:53.068178Z] Loop 3221: Loss: 8.79e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0679 +[2026-01-29T22:28:54.228867Z] Loop 3222: Loss: 7.80e-04, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0676 +[2026-01-29T22:28:55.389886Z] Loop 3223: Loss: 8.43e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0664 +[2026-01-29T22:28:56.551881Z] Loop 3224: Loss: 7.98e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0628 +[2026-01-29T22:28:57.713032Z] Loop 3225: Loss: 9.22e-04, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0630 +[2026-01-29T22:28:58.874731Z] Loop 3226: Loss: 9.57e-04, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0644 +[2026-01-29T22:29:00.035210Z] Loop 3227: Loss: 7.92e-04, Avg Return: 0.445, Regret: 0.3507, Entropy: 0.0702 +[2026-01-29T22:29:01.196180Z] Loop 3228: Loss: 1.04e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0639 +[2026-01-29T22:29:02.357963Z] Loop 3229: Loss: 9.66e-04, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0676 +[2026-01-29T22:29:03.567084Z] Loop 3230: Loss: 1.05e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0636 +[2026-01-29T22:29:04.728852Z] Loop 3231: Loss: 1.14e-03, Avg Return: 0.459, Regret: 0.3507, Entropy: 0.0666 +[2026-01-29T22:29:05.890113Z] Loop 3232: Loss: 9.91e-04, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0647 +[2026-01-29T22:29:07.052832Z] Loop 3233: Loss: 9.03e-04, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0699 +[2026-01-29T22:29:08.213388Z] Loop 3234: Loss: 9.33e-04, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0598 +[2026-01-29T22:29:09.375159Z] Loop 3235: Loss: 9.33e-04, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0615 +[2026-01-29T22:29:10.537543Z] Loop 3236: Loss: 7.83e-04, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0648 +[2026-01-29T22:29:11.699275Z] Loop 3237: Loss: 7.55e-04, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0659 +[2026-01-29T22:29:12.861290Z] Loop 3238: Loss: 7.31e-04, Avg Return: 0.445, Regret: 0.3507, Entropy: 0.0609 +[2026-01-29T22:29:14.021422Z] Loop 3239: Loss: 7.26e-04, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0630 +[2026-01-29T22:29:15.232386Z] Loop 3240: Loss: 6.18e-04, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0613 +[2026-01-29T22:29:16.393057Z] Loop 3241: Loss: 5.39e-04, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0674 +[2026-01-29T22:29:17.554874Z] Loop 3242: Loss: 5.87e-04, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0649 +[2026-01-29T22:29:18.715817Z] Loop 3243: Loss: 5.53e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0620 +[2026-01-29T22:29:19.878161Z] Loop 3244: Loss: 7.88e-04, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0709 +[2026-01-29T22:29:21.041160Z] Loop 3245: Loss: 6.00e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0658 +[2026-01-29T22:29:22.203726Z] Loop 3246: Loss: 6.98e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0677 +[2026-01-29T22:29:23.365313Z] Loop 3247: Loss: 8.02e-04, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0713 +[2026-01-29T22:29:24.526669Z] Loop 3248: Loss: 7.91e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0666 +[2026-01-29T22:29:25.686782Z] Loop 3249: Loss: 8.32e-04, Avg Return: 0.444, Regret: 0.3507, Entropy: 0.0715 +[2026-01-29T22:29:26.893027Z] Loop 3250: Loss: 8.59e-04, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0765 +[2026-01-29T22:29:28.055462Z] Loop 3251: Loss: 9.91e-04, Avg Return: 0.458, Regret: 0.3510, Entropy: 0.0719 +[2026-01-29T22:29:29.215659Z] Loop 3252: Loss: 9.04e-04, Avg Return: 0.448, Regret: 0.3510, Entropy: 0.0737 +[2026-01-29T22:29:30.376494Z] Loop 3253: Loss: 7.58e-04, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0725 +[2026-01-29T22:29:31.539610Z] Loop 3254: Loss: 8.44e-04, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0742 +[2026-01-29T22:29:32.701764Z] Loop 3255: Loss: 6.46e-04, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.0667 +[2026-01-29T22:29:33.863518Z] Loop 3256: Loss: 7.77e-04, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0657 +[2026-01-29T22:29:35.023526Z] Loop 3257: Loss: 7.94e-04, Avg Return: 0.454, Regret: 0.3510, Entropy: 0.0743 +[2026-01-29T22:29:36.184690Z] Loop 3258: Loss: 9.47e-04, Avg Return: 0.451, Regret: 0.3510, Entropy: 0.0691 +[2026-01-29T22:29:37.348056Z] Loop 3259: Loss: 8.56e-04, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0676 +[2026-01-29T22:29:38.555656Z] Loop 3260: Loss: 8.84e-04, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0723 +[2026-01-29T22:29:39.717226Z] Loop 3261: Loss: 9.03e-04, Avg Return: 0.462, Regret: 0.3511, Entropy: 0.0671 +[2026-01-29T22:29:40.877897Z] Loop 3262: Loss: 8.21e-04, Avg Return: 0.460, Regret: 0.3511, Entropy: 0.0669 +[2026-01-29T22:29:42.039190Z] Loop 3263: Loss: 8.05e-04, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0734 +[2026-01-29T22:29:43.199351Z] Loop 3264: Loss: 7.95e-04, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.0707 +[2026-01-29T22:29:44.360486Z] Loop 3265: Loss: 6.82e-04, Avg Return: 0.460, Regret: 0.3511, Entropy: 0.0680 +[2026-01-29T22:29:45.520812Z] Loop 3266: Loss: 4.42e-04, Avg Return: 0.446, Regret: 0.3511, Entropy: 0.0677 +[2026-01-29T22:29:46.681733Z] Loop 3267: Loss: 5.84e-04, Avg Return: 0.449, Regret: 0.3511, Entropy: 0.0610 +[2026-01-29T22:29:47.843327Z] Loop 3268: Loss: 5.08e-04, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.0621 +[2026-01-29T22:29:49.004307Z] Loop 3269: Loss: 6.04e-04, Avg Return: 0.460, Regret: 0.3511, Entropy: 0.0621 +[2026-01-29T22:29:50.211681Z] Loop 3270: Loss: 6.47e-04, Avg Return: 0.449, Regret: 0.3508, Entropy: 0.0637 +[2026-01-29T22:29:51.373198Z] Loop 3271: Loss: 6.86e-04, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0635 +[2026-01-29T22:29:52.534593Z] Loop 3272: Loss: 6.47e-04, Avg Return: 0.454, Regret: 0.3508, Entropy: 0.0657 +[2026-01-29T22:29:53.694619Z] Loop 3273: Loss: 5.88e-04, Avg Return: 0.452, Regret: 0.3508, Entropy: 0.0616 +[2026-01-29T22:29:54.855672Z] Loop 3274: Loss: 6.29e-04, Avg Return: 0.441, Regret: 0.3508, Entropy: 0.0688 +[2026-01-29T22:29:56.015652Z] Loop 3275: Loss: 5.77e-04, Avg Return: 0.451, Regret: 0.3508, Entropy: 0.0637 +[2026-01-29T22:29:57.176147Z] Loop 3276: Loss: 5.52e-04, Avg Return: 0.448, Regret: 0.3508, Entropy: 0.0647 +[2026-01-29T22:29:58.337643Z] Loop 3277: Loss: 4.87e-04, Avg Return: 0.450, Regret: 0.3508, Entropy: 0.0669 +[2026-01-29T22:29:59.498484Z] Loop 3278: Loss: 6.71e-04, Avg Return: 0.459, Regret: 0.3508, Entropy: 0.0717 +[2026-01-29T22:30:00.660005Z] Loop 3279: Loss: 6.33e-04, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0590 +[2026-01-29T22:30:01.865138Z] Loop 3280: Loss: 6.69e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0683 +[2026-01-29T22:30:03.027114Z] Loop 3281: Loss: 6.66e-04, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0689 +[2026-01-29T22:30:04.190272Z] Loop 3282: Loss: 6.23e-04, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0724 +[2026-01-29T22:30:05.351207Z] Loop 3283: Loss: 7.40e-04, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0726 +[2026-01-29T22:30:06.511494Z] Loop 3284: Loss: 8.84e-04, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0730 +[2026-01-29T22:30:07.671949Z] Loop 3285: Loss: 7.69e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0724 +[2026-01-29T22:30:08.834741Z] Loop 3286: Loss: 6.73e-04, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0657 +[2026-01-29T22:30:09.996700Z] Loop 3287: Loss: 6.06e-04, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0663 +[2026-01-29T22:30:11.157902Z] Loop 3288: Loss: 5.93e-04, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0634 +[2026-01-29T22:30:12.317873Z] Loop 3289: Loss: 6.41e-04, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0639 +[2026-01-29T22:30:13.533337Z] Loop 3290: Loss: 5.72e-04, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0652 +[2026-01-29T22:30:14.693969Z] Loop 3291: Loss: 6.75e-04, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0625 +[2026-01-29T22:30:15.855859Z] Loop 3292: Loss: 7.03e-04, Avg Return: 0.449, Regret: 0.3506, Entropy: 0.0643 +[2026-01-29T22:30:17.017684Z] Loop 3293: Loss: 6.17e-04, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0616 +[2026-01-29T22:30:18.178659Z] Loop 3294: Loss: 6.80e-04, Avg Return: 0.452, Regret: 0.3506, Entropy: 0.0675 +[2026-01-29T22:30:19.340346Z] Loop 3295: Loss: 5.73e-04, Avg Return: 0.453, Regret: 0.3506, Entropy: 0.0684 +[2026-01-29T22:30:20.500802Z] Loop 3296: Loss: 7.16e-04, Avg Return: 0.449, Regret: 0.3506, Entropy: 0.0650 +[2026-01-29T22:30:21.662240Z] Loop 3297: Loss: 7.41e-04, Avg Return: 0.465, Regret: 0.3506, Entropy: 0.0607 +[2026-01-29T22:30:22.823924Z] Loop 3298: Loss: 7.49e-04, Avg Return: 0.457, Regret: 0.3506, Entropy: 0.0646 +[2026-01-29T22:30:23.984930Z] Loop 3299: Loss: 7.74e-04, Avg Return: 0.443, Regret: 0.3506, Entropy: 0.0685 +[2026-01-29T22:30:25.192158Z] Loop 3300: Loss: 9.81e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0719 +[2026-01-29T22:30:26.353291Z] Loop 3301: Loss: 9.86e-04, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0742 +[2026-01-29T22:30:27.515425Z] Loop 3302: Loss: 1.39e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0704 +[2026-01-29T22:30:28.676729Z] Loop 3303: Loss: 1.47e-03, Avg Return: 0.445, Regret: 0.3507, Entropy: 0.0732 +[2026-01-29T22:30:29.839622Z] Loop 3304: Loss: 1.83e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0801 +[2026-01-29T22:30:31.000981Z] Loop 3305: Loss: 2.29e-03, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0869 +[2026-01-29T22:30:32.163387Z] Loop 3306: Loss: 2.32e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0862 +[2026-01-29T22:30:33.325119Z] Loop 3307: Loss: 2.59e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0918 +[2026-01-29T22:30:34.485733Z] Loop 3308: Loss: 2.71e-03, Avg Return: 0.444, Regret: 0.3507, Entropy: 0.0877 +[2026-01-29T22:30:35.647331Z] Loop 3309: Loss: 2.70e-03, Avg Return: 0.443, Regret: 0.3507, Entropy: 0.0899 +[2026-01-29T22:30:36.855125Z] Loop 3310: Loss: 3.33e-03, Avg Return: 0.443, Regret: 0.3617, Entropy: 0.0895 +[2026-01-29T22:30:38.016953Z] Loop 3311: Loss: 3.15e-03, Avg Return: 0.437, Regret: 0.3617, Entropy: 0.0926 +[2026-01-29T22:30:39.178233Z] Loop 3312: Loss: 2.99e-03, Avg Return: 0.450, Regret: 0.3617, Entropy: 0.0855 +[2026-01-29T22:30:40.342572Z] Loop 3313: Loss: 2.75e-03, Avg Return: 0.447, Regret: 0.3617, Entropy: 0.0807 +[2026-01-29T22:30:41.505148Z] Loop 3314: Loss: 2.38e-03, Avg Return: 0.451, Regret: 0.3617, Entropy: 0.0726 +[2026-01-29T22:30:42.667131Z] Loop 3315: Loss: 1.90e-03, Avg Return: 0.453, Regret: 0.3617, Entropy: 0.0693 +[2026-01-29T22:30:43.828722Z] Loop 3316: Loss: 1.72e-03, Avg Return: 0.455, Regret: 0.3617, Entropy: 0.0719 +[2026-01-29T22:30:44.989040Z] Loop 3317: Loss: 1.28e-03, Avg Return: 0.456, Regret: 0.3617, Entropy: 0.0647 +[2026-01-29T22:30:46.150148Z] Loop 3318: Loss: 1.32e-03, Avg Return: 0.451, Regret: 0.3617, Entropy: 0.0686 +[2026-01-29T22:30:47.314914Z] Loop 3319: Loss: 1.16e-03, Avg Return: 0.453, Regret: 0.3617, Entropy: 0.0626 +[2026-01-29T22:30:48.522377Z] Loop 3320: Loss: 1.07e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0602 +[2026-01-29T22:30:49.684061Z] Loop 3321: Loss: 1.12e-03, Avg Return: 0.463, Regret: 0.3507, Entropy: 0.0613 +[2026-01-29T22:30:50.846665Z] Loop 3322: Loss: 1.17e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0551 +[2026-01-29T22:30:52.012041Z] Loop 3323: Loss: 7.87e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0599 +[2026-01-29T22:30:53.174336Z] Loop 3324: Loss: 1.06e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0602 +[2026-01-29T22:30:54.337067Z] Loop 3325: Loss: 9.63e-04, Avg Return: 0.459, Regret: 0.3507, Entropy: 0.0672 +[2026-01-29T22:30:55.498325Z] Loop 3326: Loss: 1.22e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0694 +[2026-01-29T22:30:56.661099Z] Loop 3327: Loss: 1.13e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0595 +[2026-01-29T22:30:57.822996Z] Loop 3328: Loss: 8.96e-04, Avg Return: 0.444, Regret: 0.3507, Entropy: 0.0658 +[2026-01-29T22:30:58.984270Z] Loop 3329: Loss: 8.16e-04, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0620 +[2026-01-29T22:31:00.193352Z] Loop 3330: Loss: 9.68e-04, Avg Return: 0.449, Regret: 0.3511, Entropy: 0.0662 +[2026-01-29T22:31:01.355530Z] Loop 3331: Loss: 9.99e-04, Avg Return: 0.459, Regret: 0.3511, Entropy: 0.0657 +[2026-01-29T22:31:02.517609Z] Loop 3332: Loss: 1.20e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0656 +[2026-01-29T22:31:03.677501Z] Loop 3333: Loss: 1.09e-03, Avg Return: 0.453, Regret: 0.3511, Entropy: 0.0543 +[2026-01-29T22:31:04.838639Z] Loop 3334: Loss: 1.18e-03, Avg Return: 0.458, Regret: 0.3511, Entropy: 0.0510 +[2026-01-29T22:31:06.000089Z] Loop 3335: Loss: 1.42e-03, Avg Return: 0.459, Regret: 0.3511, Entropy: 0.0565 +[2026-01-29T22:31:07.161458Z] Loop 3336: Loss: 2.32e-03, Avg Return: 0.464, Regret: 0.3511, Entropy: 0.0634 +[2026-01-29T22:31:08.323047Z] Loop 3337: Loss: 2.39e-03, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.0705 +[2026-01-29T22:31:09.489784Z] Loop 3338: Loss: 3.01e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0742 +[2026-01-29T22:31:10.651130Z] Loop 3339: Loss: 2.77e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0718 +[2026-01-29T22:31:11.859266Z] Loop 3340: Loss: 3.02e-03, Avg Return: 0.456, Regret: 0.3521, Entropy: 0.0734 +[2026-01-29T22:31:13.020512Z] Loop 3341: Loss: 2.40e-03, Avg Return: 0.451, Regret: 0.3521, Entropy: 0.0640 +[2026-01-29T22:31:14.180866Z] Loop 3342: Loss: 1.68e-03, Avg Return: 0.457, Regret: 0.3521, Entropy: 0.0522 +[2026-01-29T22:31:15.341935Z] Loop 3343: Loss: 1.34e-03, Avg Return: 0.453, Regret: 0.3521, Entropy: 0.0507 +[2026-01-29T22:31:16.503993Z] Loop 3344: Loss: 9.69e-04, Avg Return: 0.458, Regret: 0.3521, Entropy: 0.0483 +[2026-01-29T22:31:17.664763Z] Loop 3345: Loss: 1.03e-03, Avg Return: 0.453, Regret: 0.3521, Entropy: 0.0505 +[2026-01-29T22:31:18.826876Z] Loop 3346: Loss: 9.34e-04, Avg Return: 0.452, Regret: 0.3521, Entropy: 0.0560 +[2026-01-29T22:31:19.987441Z] Loop 3347: Loss: 1.24e-03, Avg Return: 0.455, Regret: 0.3521, Entropy: 0.0566 +[2026-01-29T22:31:21.148352Z] Loop 3348: Loss: 1.20e-03, Avg Return: 0.456, Regret: 0.3521, Entropy: 0.0603 +[2026-01-29T22:31:22.310213Z] Loop 3349: Loss: 1.07e-03, Avg Return: 0.450, Regret: 0.3521, Entropy: 0.0660 +[2026-01-29T22:31:23.515211Z] Loop 3350: Loss: 1.04e-03, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0557 +[2026-01-29T22:31:24.676662Z] Loop 3351: Loss: 7.46e-04, Avg Return: 0.449, Regret: 0.3510, Entropy: 0.0585 +[2026-01-29T22:31:25.837719Z] Loop 3352: Loss: 7.06e-04, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0622 +[2026-01-29T22:31:26.999520Z] Loop 3353: Loss: 6.72e-04, Avg Return: 0.446, Regret: 0.3510, Entropy: 0.0587 +[2026-01-29T22:31:28.163296Z] Loop 3354: Loss: 8.40e-04, Avg Return: 0.454, Regret: 0.3510, Entropy: 0.0579 +[2026-01-29T22:31:29.325089Z] Loop 3355: Loss: 8.49e-04, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0575 +[2026-01-29T22:31:30.486456Z] Loop 3356: Loss: 1.02e-03, Avg Return: 0.454, Regret: 0.3510, Entropy: 0.0621 +[2026-01-29T22:31:31.647069Z] Loop 3357: Loss: 1.24e-03, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0643 +[2026-01-29T22:31:32.811499Z] Loop 3358: Loss: 1.15e-03, Avg Return: 0.451, Regret: 0.3510, Entropy: 0.0641 +[2026-01-29T22:31:33.974761Z] Loop 3359: Loss: 7.73e-04, Avg Return: 0.450, Regret: 0.3510, Entropy: 0.0611 +[2026-01-29T22:31:35.186226Z] Loop 3360: Loss: 5.76e-04, Avg Return: 0.446, Regret: 0.3518, Entropy: 0.0581 +[2026-01-29T22:31:36.347065Z] Loop 3361: Loss: 5.73e-04, Avg Return: 0.455, Regret: 0.3518, Entropy: 0.0589 +[2026-01-29T22:31:37.508660Z] Loop 3362: Loss: 6.60e-04, Avg Return: 0.452, Regret: 0.3518, Entropy: 0.0671 +[2026-01-29T22:31:38.668238Z] Loop 3363: Loss: 1.09e-03, Avg Return: 0.454, Regret: 0.3518, Entropy: 0.0678 +[2026-01-29T22:31:39.833013Z] Loop 3364: Loss: 1.20e-03, Avg Return: 0.454, Regret: 0.3518, Entropy: 0.0692 +[2026-01-29T22:31:41.002225Z] Loop 3365: Loss: 1.64e-03, Avg Return: 0.453, Regret: 0.3518, Entropy: 0.0772 +[2026-01-29T22:31:42.164279Z] Loop 3366: Loss: 1.66e-03, Avg Return: 0.453, Regret: 0.3518, Entropy: 0.0775 +[2026-01-29T22:31:43.326663Z] Loop 3367: Loss: 1.70e-03, Avg Return: 0.458, Regret: 0.3518, Entropy: 0.0783 +[2026-01-29T22:31:44.489303Z] Loop 3368: Loss: 1.91e-03, Avg Return: 0.451, Regret: 0.3518, Entropy: 0.0848 +[2026-01-29T22:31:45.650942Z] Loop 3369: Loss: 1.68e-03, Avg Return: 0.451, Regret: 0.3518, Entropy: 0.0763 +[2026-01-29T22:31:46.861532Z] Loop 3370: Loss: 1.35e-03, Avg Return: 0.457, Regret: 0.3522, Entropy: 0.0713 +[2026-01-29T22:31:48.028098Z] Loop 3371: Loss: 1.08e-03, Avg Return: 0.449, Regret: 0.3522, Entropy: 0.0666 +[2026-01-29T22:31:49.192953Z] Loop 3372: Loss: 7.64e-04, Avg Return: 0.444, Regret: 0.3522, Entropy: 0.0619 +[2026-01-29T22:31:50.353963Z] Loop 3373: Loss: 7.76e-04, Avg Return: 0.458, Regret: 0.3522, Entropy: 0.0535 +[2026-01-29T22:31:51.515369Z] Loop 3374: Loss: 5.35e-04, Avg Return: 0.449, Regret: 0.3522, Entropy: 0.0553 +[2026-01-29T22:31:52.676732Z] Loop 3375: Loss: 5.58e-04, Avg Return: 0.456, Regret: 0.3522, Entropy: 0.0570 +[2026-01-29T22:31:53.837613Z] Loop 3376: Loss: 6.17e-04, Avg Return: 0.458, Regret: 0.3522, Entropy: 0.0551 +[2026-01-29T22:31:54.999252Z] Loop 3377: Loss: 4.89e-04, Avg Return: 0.459, Regret: 0.3522, Entropy: 0.0604 +[2026-01-29T22:31:56.161464Z] Loop 3378: Loss: 5.02e-04, Avg Return: 0.452, Regret: 0.3522, Entropy: 0.0619 +[2026-01-29T22:31:57.328021Z] Loop 3379: Loss: 5.06e-04, Avg Return: 0.458, Regret: 0.3522, Entropy: 0.0586 +[2026-01-29T22:31:58.538925Z] Loop 3380: Loss: 5.60e-04, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0571 +[2026-01-29T22:31:59.700618Z] Loop 3381: Loss: 5.53e-04, Avg Return: 0.457, Regret: 0.3510, Entropy: 0.0566 +[2026-01-29T22:32:00.863139Z] Loop 3382: Loss: 5.55e-04, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0572 +[2026-01-29T22:32:02.023608Z] Loop 3383: Loss: 5.57e-04, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.0557 +[2026-01-29T22:32:03.185289Z] Loop 3384: Loss: 5.39e-04, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0607 +[2026-01-29T22:32:04.345088Z] Loop 3385: Loss: 5.98e-04, Avg Return: 0.458, Regret: 0.3510, Entropy: 0.0544 +[2026-01-29T22:32:05.506103Z] Loop 3386: Loss: 6.65e-04, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0557 +[2026-01-29T22:32:06.665679Z] Loop 3387: Loss: 7.90e-04, Avg Return: 0.448, Regret: 0.3510, Entropy: 0.0556 +[2026-01-29T22:32:07.825859Z] Loop 3388: Loss: 7.70e-04, Avg Return: 0.455, Regret: 0.3510, Entropy: 0.0551 +[2026-01-29T22:32:08.987272Z] Loop 3389: Loss: 7.74e-04, Avg Return: 0.446, Regret: 0.3510, Entropy: 0.0655 +[2026-01-29T22:32:10.194763Z] Loop 3390: Loss: 6.49e-04, Avg Return: 0.449, Regret: 0.3506, Entropy: 0.0548 +[2026-01-29T22:32:11.359119Z] Loop 3391: Loss: 7.47e-04, Avg Return: 0.449, Regret: 0.3506, Entropy: 0.0598 +[2026-01-29T22:32:12.521336Z] Loop 3392: Loss: 6.70e-04, Avg Return: 0.459, Regret: 0.3506, Entropy: 0.0561 +[2026-01-29T22:32:13.685690Z] Loop 3393: Loss: 6.83e-04, Avg Return: 0.454, Regret: 0.3506, Entropy: 0.0527 +[2026-01-29T22:32:14.847461Z] Loop 3394: Loss: 5.93e-04, Avg Return: 0.450, Regret: 0.3506, Entropy: 0.0581 +[2026-01-29T22:32:16.009394Z] Loop 3395: Loss: 5.08e-04, Avg Return: 0.447, Regret: 0.3506, Entropy: 0.0587 +[2026-01-29T22:32:17.173487Z] Loop 3396: Loss: 6.11e-04, Avg Return: 0.453, Regret: 0.3506, Entropy: 0.0513 +[2026-01-29T22:32:18.335425Z] Loop 3397: Loss: 5.39e-04, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0571 +[2026-01-29T22:32:19.496952Z] Loop 3398: Loss: 4.60e-04, Avg Return: 0.452, Regret: 0.3506, Entropy: 0.0511 +[2026-01-29T22:32:20.657193Z] Loop 3399: Loss: 4.82e-04, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0641 +[2026-01-29T22:32:21.865035Z] Loop 3400: Loss: 4.72e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0507 +[2026-01-29T22:32:23.026151Z] Loop 3401: Loss: 5.45e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0528 +[2026-01-29T22:32:24.187798Z] Loop 3402: Loss: 5.30e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0517 +[2026-01-29T22:32:25.349178Z] Loop 3403: Loss: 6.20e-04, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0524 +[2026-01-29T22:32:26.510044Z] Loop 3404: Loss: 5.11e-04, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0526 +[2026-01-29T22:32:27.672031Z] Loop 3405: Loss: 4.86e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0531 +[2026-01-29T22:32:28.836208Z] Loop 3406: Loss: 5.95e-04, Avg Return: 0.459, Regret: 0.3507, Entropy: 0.0552 +[2026-01-29T22:32:29.999980Z] Loop 3407: Loss: 4.93e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0559 +[2026-01-29T22:32:31.163868Z] Loop 3408: Loss: 5.61e-04, Avg Return: 0.446, Regret: 0.3507, Entropy: 0.0577 +[2026-01-29T22:32:32.324840Z] Loop 3409: Loss: 4.29e-04, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0532 +[2026-01-29T22:32:33.537479Z] Loop 3410: Loss: 4.38e-04, Avg Return: 0.457, Regret: 0.3506, Entropy: 0.0548 +[2026-01-29T22:32:34.699631Z] Loop 3411: Loss: 4.56e-04, Avg Return: 0.447, Regret: 0.3506, Entropy: 0.0560 +[2026-01-29T22:32:35.861320Z] Loop 3412: Loss: 4.32e-04, Avg Return: 0.450, Regret: 0.3506, Entropy: 0.0599 +[2026-01-29T22:32:37.022260Z] Loop 3413: Loss: 5.79e-04, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0623 +[2026-01-29T22:32:38.183952Z] Loop 3414: Loss: 7.92e-04, Avg Return: 0.452, Regret: 0.3506, Entropy: 0.0553 +[2026-01-29T22:32:39.343885Z] Loop 3415: Loss: 1.05e-03, Avg Return: 0.454, Regret: 0.3506, Entropy: 0.0607 +[2026-01-29T22:32:40.505122Z] Loop 3416: Loss: 1.18e-03, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0649 +[2026-01-29T22:32:41.667184Z] Loop 3417: Loss: 1.60e-03, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0710 +[2026-01-29T22:32:42.827583Z] Loop 3418: Loss: 1.42e-03, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0649 +[2026-01-29T22:32:43.993837Z] Loop 3419: Loss: 1.51e-03, Avg Return: 0.447, Regret: 0.3506, Entropy: 0.0658 +[2026-01-29T22:32:45.204582Z] Loop 3420: Loss: 1.84e-03, Avg Return: 0.452, Regret: 0.3509, Entropy: 0.0737 +[2026-01-29T22:32:46.366010Z] Loop 3421: Loss: 1.95e-03, Avg Return: 0.447, Regret: 0.3509, Entropy: 0.0791 +[2026-01-29T22:32:47.526834Z] Loop 3422: Loss: 1.68e-03, Avg Return: 0.456, Regret: 0.3509, Entropy: 0.0764 +[2026-01-29T22:32:48.688925Z] Loop 3423: Loss: 1.51e-03, Avg Return: 0.454, Regret: 0.3509, Entropy: 0.0741 +[2026-01-29T22:32:49.850783Z] Loop 3424: Loss: 1.45e-03, Avg Return: 0.450, Regret: 0.3509, Entropy: 0.0680 +[2026-01-29T22:32:51.012044Z] Loop 3425: Loss: 1.33e-03, Avg Return: 0.451, Regret: 0.3509, Entropy: 0.0682 +[2026-01-29T22:32:52.174912Z] Loop 3426: Loss: 1.22e-03, Avg Return: 0.454, Regret: 0.3509, Entropy: 0.0684 +[2026-01-29T22:32:53.335102Z] Loop 3427: Loss: 1.35e-03, Avg Return: 0.455, Regret: 0.3509, Entropy: 0.0718 +[2026-01-29T22:32:54.496508Z] Loop 3428: Loss: 1.46e-03, Avg Return: 0.446, Regret: 0.3509, Entropy: 0.0662 +[2026-01-29T22:32:55.657882Z] Loop 3429: Loss: 1.81e-03, Avg Return: 0.450, Regret: 0.3509, Entropy: 0.0751 +[2026-01-29T22:32:56.866436Z] Loop 3430: Loss: 1.78e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0755 +[2026-01-29T22:32:58.030174Z] Loop 3431: Loss: 1.46e-03, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0701 +[2026-01-29T22:32:59.191045Z] Loop 3432: Loss: 1.28e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0662 +[2026-01-29T22:33:00.352525Z] Loop 3433: Loss: 1.19e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0645 +[2026-01-29T22:33:01.513663Z] Loop 3434: Loss: 9.58e-04, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0557 +[2026-01-29T22:33:02.675858Z] Loop 3435: Loss: 6.36e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0563 +[2026-01-29T22:33:03.836125Z] Loop 3436: Loss: 5.95e-04, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0573 +[2026-01-29T22:33:04.997608Z] Loop 3437: Loss: 4.80e-04, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0563 +[2026-01-29T22:33:06.159461Z] Loop 3438: Loss: 6.45e-04, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0595 +[2026-01-29T22:33:07.322673Z] Loop 3439: Loss: 7.00e-04, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0571 +[2026-01-29T22:33:08.541091Z] Loop 3440: Loss: 6.84e-04, Avg Return: 0.462, Regret: 0.3506, Entropy: 0.0590 +[2026-01-29T22:33:09.701997Z] Loop 3441: Loss: 5.79e-04, Avg Return: 0.454, Regret: 0.3506, Entropy: 0.0577 +[2026-01-29T22:33:10.863592Z] Loop 3442: Loss: 5.50e-04, Avg Return: 0.450, Regret: 0.3506, Entropy: 0.0619 +[2026-01-29T22:33:12.027247Z] Loop 3443: Loss: 5.24e-04, Avg Return: 0.456, Regret: 0.3506, Entropy: 0.0571 +[2026-01-29T22:33:13.191514Z] Loop 3444: Loss: 5.01e-04, Avg Return: 0.456, Regret: 0.3506, Entropy: 0.0589 +[2026-01-29T22:33:14.355210Z] Loop 3445: Loss: 5.12e-04, Avg Return: 0.453, Regret: 0.3506, Entropy: 0.0583 +[2026-01-29T22:33:15.516828Z] Loop 3446: Loss: 5.58e-04, Avg Return: 0.457, Regret: 0.3506, Entropy: 0.0596 +[2026-01-29T22:33:16.679880Z] Loop 3447: Loss: 5.53e-04, Avg Return: 0.450, Regret: 0.3506, Entropy: 0.0539 +[2026-01-29T22:33:17.843312Z] Loop 3448: Loss: 6.23e-04, Avg Return: 0.458, Regret: 0.3506, Entropy: 0.0555 +[2026-01-29T22:33:19.004735Z] Loop 3449: Loss: 4.91e-04, Avg Return: 0.454, Regret: 0.3506, Entropy: 0.0555 +[2026-01-29T22:33:20.218404Z] Loop 3450: Loss: 5.85e-04, Avg Return: 0.453, Regret: 0.3506, Entropy: 0.0525 +[2026-01-29T22:33:21.381144Z] Loop 3451: Loss: 6.29e-04, Avg Return: 0.459, Regret: 0.3506, Entropy: 0.0600 +[2026-01-29T22:33:22.544714Z] Loop 3452: Loss: 6.10e-04, Avg Return: 0.447, Regret: 0.3506, Entropy: 0.0580 +[2026-01-29T22:33:23.706516Z] Loop 3453: Loss: 5.66e-04, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0554 +[2026-01-29T22:33:24.868505Z] Loop 3454: Loss: 6.46e-04, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0539 +[2026-01-29T22:33:26.030681Z] Loop 3455: Loss: 5.41e-04, Avg Return: 0.450, Regret: 0.3506, Entropy: 0.0567 +[2026-01-29T22:33:27.192683Z] Loop 3456: Loss: 5.89e-04, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0560 +[2026-01-29T22:33:28.356185Z] Loop 3457: Loss: 8.76e-04, Avg Return: 0.464, Regret: 0.3506, Entropy: 0.0561 +[2026-01-29T22:33:29.517254Z] Loop 3458: Loss: 7.68e-04, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0629 +[2026-01-29T22:33:30.678780Z] Loop 3459: Loss: 6.93e-04, Avg Return: 0.450, Regret: 0.3506, Entropy: 0.0560 +[2026-01-29T22:33:31.887476Z] Loop 3460: Loss: 6.85e-04, Avg Return: 0.456, Regret: 0.3506, Entropy: 0.0512 +[2026-01-29T22:33:33.048502Z] Loop 3461: Loss: 7.80e-04, Avg Return: 0.453, Regret: 0.3506, Entropy: 0.0543 +[2026-01-29T22:33:34.211703Z] Loop 3462: Loss: 6.53e-04, Avg Return: 0.449, Regret: 0.3506, Entropy: 0.0581 +[2026-01-29T22:33:35.371936Z] Loop 3463: Loss: 7.33e-04, Avg Return: 0.458, Regret: 0.3506, Entropy: 0.0584 +[2026-01-29T22:33:36.534047Z] Loop 3464: Loss: 6.62e-04, Avg Return: 0.458, Regret: 0.3506, Entropy: 0.0551 +[2026-01-29T22:33:37.695537Z] Loop 3465: Loss: 1.03e-03, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0598 +[2026-01-29T22:33:38.860001Z] Loop 3466: Loss: 1.11e-03, Avg Return: 0.457, Regret: 0.3506, Entropy: 0.0606 +[2026-01-29T22:33:40.021555Z] Loop 3467: Loss: 1.11e-03, Avg Return: 0.453, Regret: 0.3506, Entropy: 0.0636 +[2026-01-29T22:33:41.182500Z] Loop 3468: Loss: 1.23e-03, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0647 +[2026-01-29T22:33:42.344777Z] Loop 3469: Loss: 1.27e-03, Avg Return: 0.448, Regret: 0.3506, Entropy: 0.0654 +[2026-01-29T22:33:43.559368Z] Loop 3470: Loss: 1.13e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0644 +[2026-01-29T22:33:44.725593Z] Loop 3471: Loss: 1.15e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0657 +[2026-01-29T22:33:45.886263Z] Loop 3472: Loss: 7.72e-04, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0588 +[2026-01-29T22:33:47.047991Z] Loop 3473: Loss: 6.51e-04, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0564 +[2026-01-29T22:33:48.210006Z] Loop 3474: Loss: 5.09e-04, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0604 +[2026-01-29T22:33:49.372721Z] Loop 3475: Loss: 3.22e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0549 +[2026-01-29T22:33:50.535657Z] Loop 3476: Loss: 4.34e-04, Avg Return: 0.460, Regret: 0.3507, Entropy: 0.0563 +[2026-01-29T22:33:51.698922Z] Loop 3477: Loss: 4.44e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0502 +[2026-01-29T22:33:52.860194Z] Loop 3478: Loss: 5.58e-04, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0538 +[2026-01-29T22:33:54.022320Z] Loop 3479: Loss: 5.58e-04, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0594 +[2026-01-29T22:33:55.231010Z] Loop 3480: Loss: 6.69e-04, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0606 +[2026-01-29T22:33:56.392931Z] Loop 3481: Loss: 9.63e-04, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0564 +[2026-01-29T22:33:57.554289Z] Loop 3482: Loss: 8.54e-04, Avg Return: 0.452, Regret: 0.3506, Entropy: 0.0650 +[2026-01-29T22:33:58.715777Z] Loop 3483: Loss: 1.45e-03, Avg Return: 0.457, Regret: 0.3506, Entropy: 0.0685 +[2026-01-29T22:33:59.876236Z] Loop 3484: Loss: 1.68e-03, Avg Return: 0.458, Regret: 0.3506, Entropy: 0.0693 +[2026-01-29T22:34:01.037529Z] Loop 3485: Loss: 1.90e-03, Avg Return: 0.456, Regret: 0.3506, Entropy: 0.0685 +[2026-01-29T22:34:02.197858Z] Loop 3486: Loss: 1.62e-03, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0676 +[2026-01-29T22:34:03.358358Z] Loop 3487: Loss: 1.79e-03, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0688 +[2026-01-29T22:34:04.519572Z] Loop 3488: Loss: 1.53e-03, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0655 +[2026-01-29T22:34:05.680431Z] Loop 3489: Loss: 1.50e-03, Avg Return: 0.450, Regret: 0.3506, Entropy: 0.0700 +[2026-01-29T22:34:06.886155Z] Loop 3490: Loss: 1.65e-03, Avg Return: 0.459, Regret: 0.3507, Entropy: 0.0657 +[2026-01-29T22:34:08.047581Z] Loop 3491: Loss: 1.63e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0737 +[2026-01-29T22:34:09.209494Z] Loop 3492: Loss: 1.75e-03, Avg Return: 0.461, Regret: 0.3507, Entropy: 0.0704 +[2026-01-29T22:34:10.370333Z] Loop 3493: Loss: 1.68e-03, Avg Return: 0.461, Regret: 0.3507, Entropy: 0.0674 +[2026-01-29T22:34:11.532241Z] Loop 3494: Loss: 1.30e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0689 +[2026-01-29T22:34:12.692562Z] Loop 3495: Loss: 1.58e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0649 +[2026-01-29T22:34:13.852956Z] Loop 3496: Loss: 1.48e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0702 +[2026-01-29T22:34:15.014221Z] Loop 3497: Loss: 1.75e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0678 +[2026-01-29T22:34:16.174666Z] Loop 3498: Loss: 2.21e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0684 +[2026-01-29T22:34:17.336397Z] Loop 3499: Loss: 2.45e-03, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0679 +[2026-01-29T22:34:18.548928Z] Loop 3500: Loss: 2.28e-03, Avg Return: 0.452, Regret: 0.3515, Entropy: 0.0628 +[2026-01-29T22:34:19.710528Z] Loop 3501: Loss: 2.30e-03, Avg Return: 0.454, Regret: 0.3515, Entropy: 0.0610 +[2026-01-29T22:34:20.871097Z] Loop 3502: Loss: 2.03e-03, Avg Return: 0.453, Regret: 0.3515, Entropy: 0.0616 +[2026-01-29T22:34:22.032466Z] Loop 3503: Loss: 2.15e-03, Avg Return: 0.449, Regret: 0.3515, Entropy: 0.0622 +[2026-01-29T22:34:23.194254Z] Loop 3504: Loss: 2.13e-03, Avg Return: 0.453, Regret: 0.3515, Entropy: 0.0576 +[2026-01-29T22:34:24.355402Z] Loop 3505: Loss: 1.99e-03, Avg Return: 0.455, Regret: 0.3515, Entropy: 0.0532 +[2026-01-29T22:34:25.516944Z] Loop 3506: Loss: 1.62e-03, Avg Return: 0.458, Regret: 0.3515, Entropy: 0.0560 +[2026-01-29T22:34:26.677565Z] Loop 3507: Loss: 1.57e-03, Avg Return: 0.452, Regret: 0.3515, Entropy: 0.0509 +[2026-01-29T22:34:27.838886Z] Loop 3508: Loss: 1.30e-03, Avg Return: 0.457, Regret: 0.3515, Entropy: 0.0501 +[2026-01-29T22:34:28.999024Z] Loop 3509: Loss: 1.16e-03, Avg Return: 0.458, Regret: 0.3515, Entropy: 0.0475 +[2026-01-29T22:34:30.207964Z] Loop 3510: Loss: 1.11e-03, Avg Return: 0.452, Regret: 0.3508, Entropy: 0.0481 +[2026-01-29T22:34:31.369098Z] Loop 3511: Loss: 1.17e-03, Avg Return: 0.457, Regret: 0.3508, Entropy: 0.0490 +[2026-01-29T22:34:32.530156Z] Loop 3512: Loss: 1.26e-03, Avg Return: 0.456, Regret: 0.3508, Entropy: 0.0492 +[2026-01-29T22:34:33.691206Z] Loop 3513: Loss: 1.17e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0475 +[2026-01-29T22:34:34.851542Z] Loop 3514: Loss: 1.11e-03, Avg Return: 0.459, Regret: 0.3508, Entropy: 0.0474 +[2026-01-29T22:34:36.012774Z] Loop 3515: Loss: 1.01e-03, Avg Return: 0.443, Regret: 0.3508, Entropy: 0.0485 +[2026-01-29T22:34:37.173088Z] Loop 3516: Loss: 1.42e-03, Avg Return: 0.454, Regret: 0.3508, Entropy: 0.0487 +[2026-01-29T22:34:38.333817Z] Loop 3517: Loss: 1.56e-03, Avg Return: 0.457, Regret: 0.3508, Entropy: 0.0515 +[2026-01-29T22:34:39.493762Z] Loop 3518: Loss: 1.46e-03, Avg Return: 0.441, Regret: 0.3508, Entropy: 0.0549 +[2026-01-29T22:34:40.654336Z] Loop 3519: Loss: 1.71e-03, Avg Return: 0.456, Regret: 0.3508, Entropy: 0.0531 +[2026-01-29T22:34:41.874208Z] Loop 3520: Loss: 1.61e-03, Avg Return: 0.451, Regret: 0.3512, Entropy: 0.0534 +[2026-01-29T22:34:43.035924Z] Loop 3521: Loss: 1.78e-03, Avg Return: 0.452, Regret: 0.3512, Entropy: 0.0547 +[2026-01-29T22:34:44.198157Z] Loop 3522: Loss: 1.86e-03, Avg Return: 0.449, Regret: 0.3512, Entropy: 0.0600 +[2026-01-29T22:34:45.358755Z] Loop 3523: Loss: 2.37e-03, Avg Return: 0.450, Regret: 0.3512, Entropy: 0.0709 +[2026-01-29T22:34:46.520196Z] Loop 3524: Loss: 2.65e-03, Avg Return: 0.452, Regret: 0.3512, Entropy: 0.0710 +[2026-01-29T22:34:47.682183Z] Loop 3525: Loss: 2.73e-03, Avg Return: 0.449, Regret: 0.3512, Entropy: 0.0693 +[2026-01-29T22:34:48.842700Z] Loop 3526: Loss: 2.83e-03, Avg Return: 0.454, Regret: 0.3512, Entropy: 0.0712 +[2026-01-29T22:34:50.004286Z] Loop 3527: Loss: 2.64e-03, Avg Return: 0.454, Regret: 0.3512, Entropy: 0.0669 +[2026-01-29T22:34:51.165513Z] Loop 3528: Loss: 3.00e-03, Avg Return: 0.452, Regret: 0.3512, Entropy: 0.0730 +[2026-01-29T22:34:52.330079Z] Loop 3529: Loss: 2.78e-03, Avg Return: 0.448, Regret: 0.3512, Entropy: 0.0715 +[2026-01-29T22:34:53.537285Z] Loop 3530: Loss: 2.75e-03, Avg Return: 0.451, Regret: 0.3513, Entropy: 0.0721 +[2026-01-29T22:34:54.699146Z] Loop 3531: Loss: 3.01e-03, Avg Return: 0.450, Regret: 0.3513, Entropy: 0.0752 +[2026-01-29T22:34:55.860629Z] Loop 3532: Loss: 2.97e-03, Avg Return: 0.456, Regret: 0.3513, Entropy: 0.0730 +[2026-01-29T22:34:57.023981Z] Loop 3533: Loss: 2.61e-03, Avg Return: 0.456, Regret: 0.3513, Entropy: 0.0667 +[2026-01-29T22:34:58.188318Z] Loop 3534: Loss: 2.39e-03, Avg Return: 0.463, Regret: 0.3513, Entropy: 0.0625 +[2026-01-29T22:34:59.349845Z] Loop 3535: Loss: 2.66e-03, Avg Return: 0.453, Regret: 0.3513, Entropy: 0.0680 +[2026-01-29T22:35:00.511535Z] Loop 3536: Loss: 2.41e-03, Avg Return: 0.451, Regret: 0.3513, Entropy: 0.0678 +[2026-01-29T22:35:01.672964Z] Loop 3537: Loss: 2.37e-03, Avg Return: 0.448, Regret: 0.3513, Entropy: 0.0574 +[2026-01-29T22:35:02.836326Z] Loop 3538: Loss: 2.00e-03, Avg Return: 0.448, Regret: 0.3513, Entropy: 0.0579 +[2026-01-29T22:35:03.998861Z] Loop 3539: Loss: 1.95e-03, Avg Return: 0.448, Regret: 0.3513, Entropy: 0.0562 +[2026-01-29T22:35:05.208107Z] Loop 3540: Loss: 1.92e-03, Avg Return: 0.453, Regret: 0.3517, Entropy: 0.0563 +[2026-01-29T22:35:06.370137Z] Loop 3541: Loss: 2.03e-03, Avg Return: 0.461, Regret: 0.3517, Entropy: 0.0554 +[2026-01-29T22:35:07.531713Z] Loop 3542: Loss: 1.76e-03, Avg Return: 0.452, Regret: 0.3517, Entropy: 0.0511 +[2026-01-29T22:35:08.694235Z] Loop 3543: Loss: 2.08e-03, Avg Return: 0.458, Regret: 0.3517, Entropy: 0.0579 +[2026-01-29T22:35:09.855878Z] Loop 3544: Loss: 1.90e-03, Avg Return: 0.447, Regret: 0.3517, Entropy: 0.0586 +[2026-01-29T22:35:11.017257Z] Loop 3545: Loss: 1.83e-03, Avg Return: 0.459, Regret: 0.3517, Entropy: 0.0550 +[2026-01-29T22:35:12.179456Z] Loop 3546: Loss: 2.46e-03, Avg Return: 0.457, Regret: 0.3517, Entropy: 0.0601 +[2026-01-29T22:35:13.341317Z] Loop 3547: Loss: 2.38e-03, Avg Return: 0.454, Regret: 0.3517, Entropy: 0.0656 +[2026-01-29T22:35:14.502664Z] Loop 3548: Loss: 2.66e-03, Avg Return: 0.445, Regret: 0.3517, Entropy: 0.0663 +[2026-01-29T22:35:15.662775Z] Loop 3549: Loss: 2.52e-03, Avg Return: 0.447, Regret: 0.3517, Entropy: 0.0676 +[2026-01-29T22:35:16.869351Z] Loop 3550: Loss: 2.75e-03, Avg Return: 0.455, Regret: 0.3508, Entropy: 0.0647 +[2026-01-29T22:35:18.030932Z] Loop 3551: Loss: 2.61e-03, Avg Return: 0.449, Regret: 0.3508, Entropy: 0.0620 +[2026-01-29T22:35:19.193348Z] Loop 3552: Loss: 2.18e-03, Avg Return: 0.450, Regret: 0.3508, Entropy: 0.0597 +[2026-01-29T22:35:20.353816Z] Loop 3553: Loss: 2.16e-03, Avg Return: 0.450, Regret: 0.3508, Entropy: 0.0574 +[2026-01-29T22:35:21.515472Z] Loop 3554: Loss: 2.34e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0605 +[2026-01-29T22:35:22.677549Z] Loop 3555: Loss: 2.16e-03, Avg Return: 0.449, Regret: 0.3508, Entropy: 0.0597 +[2026-01-29T22:35:23.839508Z] Loop 3556: Loss: 1.77e-03, Avg Return: 0.451, Regret: 0.3508, Entropy: 0.0517 +[2026-01-29T22:35:25.001381Z] Loop 3557: Loss: 1.41e-03, Avg Return: 0.452, Regret: 0.3508, Entropy: 0.0464 +[2026-01-29T22:35:26.161625Z] Loop 3558: Loss: 1.23e-03, Avg Return: 0.454, Regret: 0.3508, Entropy: 0.0457 +[2026-01-29T22:35:27.324207Z] Loop 3559: Loss: 1.09e-03, Avg Return: 0.461, Regret: 0.3508, Entropy: 0.0451 +[2026-01-29T22:35:28.531188Z] Loop 3560: Loss: 9.98e-04, Avg Return: 0.455, Regret: 0.3509, Entropy: 0.0428 +[2026-01-29T22:35:29.694967Z] Loop 3561: Loss: 1.06e-03, Avg Return: 0.446, Regret: 0.3509, Entropy: 0.0411 +[2026-01-29T22:35:30.855385Z] Loop 3562: Loss: 9.87e-04, Avg Return: 0.453, Regret: 0.3509, Entropy: 0.0419 +[2026-01-29T22:35:32.017178Z] Loop 3563: Loss: 9.91e-04, Avg Return: 0.449, Regret: 0.3509, Entropy: 0.0421 +[2026-01-29T22:35:33.181068Z] Loop 3564: Loss: 9.57e-04, Avg Return: 0.449, Regret: 0.3509, Entropy: 0.0401 +[2026-01-29T22:35:34.343155Z] Loop 3565: Loss: 9.34e-04, Avg Return: 0.450, Regret: 0.3509, Entropy: 0.0419 +[2026-01-29T22:35:35.504457Z] Loop 3566: Loss: 9.13e-04, Avg Return: 0.450, Regret: 0.3509, Entropy: 0.0416 +[2026-01-29T22:35:36.665929Z] Loop 3567: Loss: 9.05e-04, Avg Return: 0.457, Regret: 0.3509, Entropy: 0.0397 +[2026-01-29T22:35:37.827060Z] Loop 3568: Loss: 9.51e-04, Avg Return: 0.453, Regret: 0.3509, Entropy: 0.0442 +[2026-01-29T22:35:38.990660Z] Loop 3569: Loss: 1.09e-03, Avg Return: 0.453, Regret: 0.3509, Entropy: 0.0430 +[2026-01-29T22:35:40.199379Z] Loop 3570: Loss: 1.07e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0464 +[2026-01-29T22:35:41.360444Z] Loop 3571: Loss: 9.77e-04, Avg Return: 0.460, Regret: 0.3507, Entropy: 0.0428 +[2026-01-29T22:35:42.522368Z] Loop 3572: Loss: 9.67e-04, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0445 +[2026-01-29T22:35:43.684150Z] Loop 3573: Loss: 1.12e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0410 +[2026-01-29T22:35:44.844921Z] Loop 3574: Loss: 1.05e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0451 +[2026-01-29T22:35:46.007260Z] Loop 3575: Loss: 1.08e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0424 +[2026-01-29T22:35:47.169364Z] Loop 3576: Loss: 1.01e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0421 +[2026-01-29T22:35:48.330191Z] Loop 3577: Loss: 1.05e-03, Avg Return: 0.447, Regret: 0.3507, Entropy: 0.0431 +[2026-01-29T22:35:49.491863Z] Loop 3578: Loss: 9.80e-04, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0406 +[2026-01-29T22:35:50.653007Z] Loop 3579: Loss: 1.12e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0411 +[2026-01-29T22:35:51.860410Z] Loop 3580: Loss: 1.19e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0435 +[2026-01-29T22:35:53.022773Z] Loop 3581: Loss: 1.10e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0383 +[2026-01-29T22:35:54.184529Z] Loop 3582: Loss: 1.14e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0393 +[2026-01-29T22:35:55.345234Z] Loop 3583: Loss: 1.05e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0446 +[2026-01-29T22:35:56.507822Z] Loop 3584: Loss: 9.75e-04, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0429 +[2026-01-29T22:35:57.670069Z] Loop 3585: Loss: 9.06e-04, Avg Return: 0.447, Regret: 0.3507, Entropy: 0.0433 +[2026-01-29T22:35:58.831151Z] Loop 3586: Loss: 1.09e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0409 +[2026-01-29T22:35:59.992938Z] Loop 3587: Loss: 1.05e-03, Avg Return: 0.447, Regret: 0.3507, Entropy: 0.0469 +[2026-01-29T22:36:01.153099Z] Loop 3588: Loss: 8.96e-04, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0402 +[2026-01-29T22:36:02.314588Z] Loop 3589: Loss: 9.82e-04, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0392 +[2026-01-29T22:36:03.520243Z] Loop 3590: Loss: 9.85e-04, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0461 +[2026-01-29T22:36:04.681813Z] Loop 3591: Loss: 1.08e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0448 +[2026-01-29T22:36:05.842459Z] Loop 3592: Loss: 8.85e-04, Avg Return: 0.447, Regret: 0.3507, Entropy: 0.0390 +[2026-01-29T22:36:07.003842Z] Loop 3593: Loss: 1.02e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0426 +[2026-01-29T22:36:08.165069Z] Loop 3594: Loss: 1.06e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0439 +[2026-01-29T22:36:09.325084Z] Loop 3595: Loss: 1.06e-03, Avg Return: 0.444, Regret: 0.3507, Entropy: 0.0444 +[2026-01-29T22:36:10.486774Z] Loop 3596: Loss: 1.29e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0454 +[2026-01-29T22:36:11.647114Z] Loop 3597: Loss: 1.32e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0478 +[2026-01-29T22:36:12.808674Z] Loop 3598: Loss: 1.38e-03, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0471 +[2026-01-29T22:36:13.969514Z] Loop 3599: Loss: 1.52e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0503 +[2026-01-29T22:36:15.175926Z] Loop 3600: Loss: 1.64e-03, Avg Return: 0.456, Regret: 0.3506, Entropy: 0.0474 +[2026-01-29T22:36:16.339924Z] Loop 3601: Loss: 1.47e-03, Avg Return: 0.456, Regret: 0.3506, Entropy: 0.0490 +[2026-01-29T22:36:17.501051Z] Loop 3602: Loss: 1.30e-03, Avg Return: 0.456, Regret: 0.3506, Entropy: 0.0455 +[2026-01-29T22:36:18.662637Z] Loop 3603: Loss: 1.35e-03, Avg Return: 0.456, Regret: 0.3506, Entropy: 0.0436 +[2026-01-29T22:36:19.823770Z] Loop 3604: Loss: 1.46e-03, Avg Return: 0.451, Regret: 0.3506, Entropy: 0.0453 +[2026-01-29T22:36:20.986313Z] Loop 3605: Loss: 1.40e-03, Avg Return: 0.450, Regret: 0.3506, Entropy: 0.0447 +[2026-01-29T22:36:22.147936Z] Loop 3606: Loss: 1.11e-03, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0433 +[2026-01-29T22:36:23.309046Z] Loop 3607: Loss: 1.11e-03, Avg Return: 0.455, Regret: 0.3506, Entropy: 0.0425 +[2026-01-29T22:36:24.470455Z] Loop 3608: Loss: 1.07e-03, Avg Return: 0.454, Regret: 0.3506, Entropy: 0.0458 +[2026-01-29T22:36:25.632887Z] Loop 3609: Loss: 9.97e-04, Avg Return: 0.453, Regret: 0.3506, Entropy: 0.0432 +[2026-01-29T22:36:26.850547Z] Loop 3610: Loss: 1.01e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0438 +[2026-01-29T22:36:28.012789Z] Loop 3611: Loss: 1.18e-03, Avg Return: 0.458, Regret: 0.3507, Entropy: 0.0452 +[2026-01-29T22:36:29.175783Z] Loop 3612: Loss: 1.21e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0463 +[2026-01-29T22:36:30.337228Z] Loop 3613: Loss: 1.39e-03, Avg Return: 0.461, Regret: 0.3507, Entropy: 0.0461 +[2026-01-29T22:36:31.499289Z] Loop 3614: Loss: 1.98e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0549 +[2026-01-29T22:36:32.662455Z] Loop 3615: Loss: 2.17e-03, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0576 +[2026-01-29T22:36:33.823910Z] Loop 3616: Loss: 2.34e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0614 +[2026-01-29T22:36:34.985904Z] Loop 3617: Loss: 2.40e-03, Avg Return: 0.445, Regret: 0.3507, Entropy: 0.0583 +[2026-01-29T22:36:36.147401Z] Loop 3618: Loss: 2.41e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0613 +[2026-01-29T22:36:37.310147Z] Loop 3619: Loss: 2.59e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0605 +[2026-01-29T22:36:38.524671Z] Loop 3620: Loss: 2.07e-03, Avg Return: 0.447, Regret: 0.3557, Entropy: 0.0545 +[2026-01-29T22:36:39.685383Z] Loop 3621: Loss: 2.32e-03, Avg Return: 0.446, Regret: 0.3557, Entropy: 0.0558 +[2026-01-29T22:36:40.847171Z] Loop 3622: Loss: 2.21e-03, Avg Return: 0.447, Regret: 0.3557, Entropy: 0.0567 +[2026-01-29T22:36:42.007857Z] Loop 3623: Loss: 2.21e-03, Avg Return: 0.445, Regret: 0.3557, Entropy: 0.0570 +[2026-01-29T22:36:43.169495Z] Loop 3624: Loss: 2.06e-03, Avg Return: 0.443, Regret: 0.3557, Entropy: 0.0563 +[2026-01-29T22:36:44.330327Z] Loop 3625: Loss: 2.14e-03, Avg Return: 0.446, Regret: 0.3557, Entropy: 0.0548 +[2026-01-29T22:36:45.491996Z] Loop 3626: Loss: 2.43e-03, Avg Return: 0.451, Regret: 0.3557, Entropy: 0.0571 +[2026-01-29T22:36:46.653711Z] Loop 3627: Loss: 2.32e-03, Avg Return: 0.451, Regret: 0.3557, Entropy: 0.0587 +[2026-01-29T22:36:47.815800Z] Loop 3628: Loss: 2.46e-03, Avg Return: 0.454, Regret: 0.3557, Entropy: 0.0607 +[2026-01-29T22:36:48.978039Z] Loop 3629: Loss: 2.40e-03, Avg Return: 0.444, Regret: 0.3557, Entropy: 0.0598 +[2026-01-29T22:36:50.183455Z] Loop 3630: Loss: 2.58e-03, Avg Return: 0.452, Regret: 0.3522, Entropy: 0.0643 +[2026-01-29T22:36:51.345053Z] Loop 3631: Loss: 2.40e-03, Avg Return: 0.454, Regret: 0.3522, Entropy: 0.0626 +[2026-01-29T22:36:52.505840Z] Loop 3632: Loss: 2.21e-03, Avg Return: 0.443, Regret: 0.3522, Entropy: 0.0614 +[2026-01-29T22:36:53.670441Z] Loop 3633: Loss: 2.29e-03, Avg Return: 0.455, Regret: 0.3522, Entropy: 0.0576 +[2026-01-29T22:36:54.831193Z] Loop 3634: Loss: 2.04e-03, Avg Return: 0.459, Regret: 0.3522, Entropy: 0.0562 +[2026-01-29T22:36:55.992106Z] Loop 3635: Loss: 1.93e-03, Avg Return: 0.450, Regret: 0.3522, Entropy: 0.0541 +[2026-01-29T22:36:57.155376Z] Loop 3636: Loss: 1.67e-03, Avg Return: 0.453, Regret: 0.3522, Entropy: 0.0538 +[2026-01-29T22:36:58.316874Z] Loop 3637: Loss: 1.80e-03, Avg Return: 0.452, Regret: 0.3522, Entropy: 0.0531 +[2026-01-29T22:36:59.478356Z] Loop 3638: Loss: 1.80e-03, Avg Return: 0.457, Regret: 0.3522, Entropy: 0.0522 +[2026-01-29T22:37:00.638467Z] Loop 3639: Loss: 1.73e-03, Avg Return: 0.458, Regret: 0.3522, Entropy: 0.0529 +[2026-01-29T22:37:01.845560Z] Loop 3640: Loss: 1.56e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0525 +[2026-01-29T22:37:03.005575Z] Loop 3641: Loss: 1.57e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0525 +[2026-01-29T22:37:04.167099Z] Loop 3642: Loss: 1.53e-03, Avg Return: 0.444, Regret: 0.3508, Entropy: 0.0504 +[2026-01-29T22:37:05.327533Z] Loop 3643: Loss: 1.57e-03, Avg Return: 0.454, Regret: 0.3508, Entropy: 0.0517 +[2026-01-29T22:37:06.488728Z] Loop 3644: Loss: 1.78e-03, Avg Return: 0.453, Regret: 0.3508, Entropy: 0.0532 +[2026-01-29T22:37:07.650743Z] Loop 3645: Loss: 1.52e-03, Avg Return: 0.450, Regret: 0.3508, Entropy: 0.0499 +[2026-01-29T22:37:08.811961Z] Loop 3646: Loss: 1.47e-03, Avg Return: 0.458, Regret: 0.3508, Entropy: 0.0459 +[2026-01-29T22:37:09.974587Z] Loop 3647: Loss: 1.70e-03, Avg Return: 0.457, Regret: 0.3508, Entropy: 0.0480 +[2026-01-29T22:37:11.135199Z] Loop 3648: Loss: 1.45e-03, Avg Return: 0.456, Regret: 0.3508, Entropy: 0.0464 +[2026-01-29T22:37:12.296452Z] Loop 3649: Loss: 1.40e-03, Avg Return: 0.454, Regret: 0.3508, Entropy: 0.0509 +[2026-01-29T22:37:13.503692Z] Loop 3650: Loss: 1.44e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0513 +[2026-01-29T22:37:14.664355Z] Loop 3651: Loss: 1.46e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0487 +[2026-01-29T22:37:15.824703Z] Loop 3652: Loss: 1.45e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0484 +[2026-01-29T22:37:16.985354Z] Loop 3653: Loss: 1.08e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0479 +[2026-01-29T22:37:18.146983Z] Loop 3654: Loss: 1.10e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0406 +[2026-01-29T22:37:19.308422Z] Loop 3655: Loss: 8.53e-04, Avg Return: 0.460, Regret: 0.3507, Entropy: 0.0373 +[2026-01-29T22:37:20.470134Z] Loop 3656: Loss: 9.99e-04, Avg Return: 0.457, Regret: 0.3507, Entropy: 0.0393 +[2026-01-29T22:37:21.629979Z] Loop 3657: Loss: 8.03e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0382 +[2026-01-29T22:37:22.791509Z] Loop 3658: Loss: 8.99e-04, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0363 +[2026-01-29T22:37:23.953131Z] Loop 3659: Loss: 1.01e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0387 +[2026-01-29T22:37:25.158414Z] Loop 3660: Loss: 1.04e-03, Avg Return: 0.462, Regret: 0.3507, Entropy: 0.0431 +[2026-01-29T22:37:26.319672Z] Loop 3661: Loss: 1.26e-03, Avg Return: 0.456, Regret: 0.3507, Entropy: 0.0410 +[2026-01-29T22:37:27.480422Z] Loop 3662: Loss: 1.41e-03, Avg Return: 0.450, Regret: 0.3507, Entropy: 0.0450 +[2026-01-29T22:37:28.641580Z] Loop 3663: Loss: 1.50e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0493 +[2026-01-29T22:37:29.802394Z] Loop 3664: Loss: 1.57e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0535 +[2026-01-29T22:37:30.964038Z] Loop 3665: Loss: 1.44e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0488 +[2026-01-29T22:37:32.123884Z] Loop 3666: Loss: 1.85e-03, Avg Return: 0.445, Regret: 0.3507, Entropy: 0.0562 +[2026-01-29T22:37:33.285081Z] Loop 3667: Loss: 2.15e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0538 +[2026-01-29T22:37:34.446523Z] Loop 3668: Loss: 2.11e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0554 +[2026-01-29T22:37:35.607164Z] Loop 3669: Loss: 2.08e-03, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0536 +[2026-01-29T22:37:36.813099Z] Loop 3670: Loss: 2.09e-03, Avg Return: 0.455, Regret: 0.3516, Entropy: 0.0557 +[2026-01-29T22:37:37.974413Z] Loop 3671: Loss: 2.05e-03, Avg Return: 0.458, Regret: 0.3516, Entropy: 0.0555 +[2026-01-29T22:37:39.136249Z] Loop 3672: Loss: 1.91e-03, Avg Return: 0.454, Regret: 0.3516, Entropy: 0.0517 +[2026-01-29T22:37:40.296734Z] Loop 3673: Loss: 1.88e-03, Avg Return: 0.448, Regret: 0.3516, Entropy: 0.0554 +[2026-01-29T22:37:41.458094Z] Loop 3674: Loss: 1.76e-03, Avg Return: 0.455, Regret: 0.3516, Entropy: 0.0539 +[2026-01-29T22:37:42.618061Z] Loop 3675: Loss: 1.93e-03, Avg Return: 0.455, Regret: 0.3516, Entropy: 0.0538 +[2026-01-29T22:37:43.779952Z] Loop 3676: Loss: 1.80e-03, Avg Return: 0.453, Regret: 0.3516, Entropy: 0.0547 +[2026-01-29T22:37:44.941753Z] Loop 3677: Loss: 1.52e-03, Avg Return: 0.456, Regret: 0.3516, Entropy: 0.0452 +[2026-01-29T22:37:46.102276Z] Loop 3678: Loss: 1.64e-03, Avg Return: 0.448, Regret: 0.3516, Entropy: 0.0488 +[2026-01-29T22:37:47.263670Z] Loop 3679: Loss: 1.61e-03, Avg Return: 0.458, Regret: 0.3516, Entropy: 0.0479 +[2026-01-29T22:37:48.467186Z] Loop 3680: Loss: 1.64e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0467 +[2026-01-29T22:37:49.628954Z] Loop 3681: Loss: 1.73e-03, Avg Return: 0.461, Regret: 0.3511, Entropy: 0.0492 +[2026-01-29T22:37:50.790123Z] Loop 3682: Loss: 1.80e-03, Avg Return: 0.460, Regret: 0.3511, Entropy: 0.0493 +[2026-01-29T22:37:51.952339Z] Loop 3683: Loss: 1.61e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0472 +[2026-01-29T22:37:53.112595Z] Loop 3684: Loss: 1.88e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0493 +[2026-01-29T22:37:54.274084Z] Loop 3685: Loss: 1.67e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0462 +[2026-01-29T22:37:55.434866Z] Loop 3686: Loss: 1.63e-03, Avg Return: 0.450, Regret: 0.3511, Entropy: 0.0470 +[2026-01-29T22:37:56.595571Z] Loop 3687: Loss: 1.80e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0487 +[2026-01-29T22:37:57.757256Z] Loop 3688: Loss: 1.74e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0451 +[2026-01-29T22:37:58.918071Z] Loop 3689: Loss: 1.43e-03, Avg Return: 0.449, Regret: 0.3511, Entropy: 0.0429 +[2026-01-29T22:38:00.124968Z] Loop 3690: Loss: 1.78e-03, Avg Return: 0.446, Regret: 0.3534, Entropy: 0.0506 +[2026-01-29T22:38:01.286274Z] Loop 3691: Loss: 1.94e-03, Avg Return: 0.447, Regret: 0.3534, Entropy: 0.0495 +[2026-01-29T22:38:02.448151Z] Loop 3692: Loss: 1.62e-03, Avg Return: 0.447, Regret: 0.3534, Entropy: 0.0457 +[2026-01-29T22:38:03.609031Z] Loop 3693: Loss: 1.88e-03, Avg Return: 0.452, Regret: 0.3534, Entropy: 0.0461 +[2026-01-29T22:38:04.770556Z] Loop 3694: Loss: 2.11e-03, Avg Return: 0.452, Regret: 0.3534, Entropy: 0.0504 +[2026-01-29T22:38:05.937543Z] Loop 3695: Loss: 2.14e-03, Avg Return: 0.453, Regret: 0.3534, Entropy: 0.0551 +[2026-01-29T22:38:07.098501Z] Loop 3696: Loss: 2.05e-03, Avg Return: 0.444, Regret: 0.3534, Entropy: 0.0556 +[2026-01-29T22:38:08.260247Z] Loop 3697: Loss: 1.85e-03, Avg Return: 0.445, Regret: 0.3534, Entropy: 0.0507 +[2026-01-29T22:38:09.420225Z] Loop 3698: Loss: 1.72e-03, Avg Return: 0.447, Regret: 0.3534, Entropy: 0.0525 +[2026-01-29T22:38:10.581491Z] Loop 3699: Loss: 1.46e-03, Avg Return: 0.437, Regret: 0.3534, Entropy: 0.0506 +[2026-01-29T22:38:11.786037Z] Loop 3700: Loss: 1.63e-03, Avg Return: 0.451, Regret: 0.3556, Entropy: 0.0515 +[2026-01-29T22:38:12.947688Z] Loop 3701: Loss: 1.91e-03, Avg Return: 0.450, Regret: 0.3556, Entropy: 0.0504 +[2026-01-29T22:38:14.107814Z] Loop 3702: Loss: 1.88e-03, Avg Return: 0.448, Regret: 0.3556, Entropy: 0.0548 +[2026-01-29T22:38:15.269099Z] Loop 3703: Loss: 1.72e-03, Avg Return: 0.441, Regret: 0.3556, Entropy: 0.0528 +[2026-01-29T22:38:16.430715Z] Loop 3704: Loss: 2.15e-03, Avg Return: 0.449, Regret: 0.3556, Entropy: 0.0579 +[2026-01-29T22:38:17.592027Z] Loop 3705: Loss: 2.11e-03, Avg Return: 0.451, Regret: 0.3556, Entropy: 0.0566 +[2026-01-29T22:38:18.753473Z] Loop 3706: Loss: 2.20e-03, Avg Return: 0.455, Regret: 0.3556, Entropy: 0.0571 +[2026-01-29T22:38:19.913482Z] Loop 3707: Loss: 2.00e-03, Avg Return: 0.457, Regret: 0.3556, Entropy: 0.0513 +[2026-01-29T22:38:21.074415Z] Loop 3708: Loss: 1.72e-03, Avg Return: 0.456, Regret: 0.3556, Entropy: 0.0531 +[2026-01-29T22:38:22.233887Z] Loop 3709: Loss: 1.69e-03, Avg Return: 0.456, Regret: 0.3556, Entropy: 0.0526 +[2026-01-29T22:38:23.437131Z] Loop 3710: Loss: 1.92e-03, Avg Return: 0.452, Regret: 0.3511, Entropy: 0.0481 +[2026-01-29T22:38:24.597287Z] Loop 3711: Loss: 1.32e-03, Avg Return: 0.448, Regret: 0.3511, Entropy: 0.0468 +[2026-01-29T22:38:25.758435Z] Loop 3712: Loss: 1.51e-03, Avg Return: 0.445, Regret: 0.3511, Entropy: 0.0458 +[2026-01-29T22:38:26.918187Z] Loop 3713: Loss: 1.68e-03, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.0466 +[2026-01-29T22:38:28.079157Z] Loop 3714: Loss: 1.67e-03, Avg Return: 0.456, Regret: 0.3511, Entropy: 0.0539 +[2026-01-29T22:38:29.240568Z] Loop 3715: Loss: 2.23e-03, Avg Return: 0.449, Regret: 0.3511, Entropy: 0.0635 +[2026-01-29T22:38:30.401557Z] Loop 3716: Loss: 2.87e-03, Avg Return: 0.455, Regret: 0.3511, Entropy: 0.0697 +[2026-01-29T22:38:31.562990Z] Loop 3717: Loss: 2.10e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0635 +[2026-01-29T22:38:32.723943Z] Loop 3718: Loss: 1.57e-03, Avg Return: 0.454, Regret: 0.3511, Entropy: 0.0639 +[2026-01-29T22:38:33.885264Z] Loop 3719: Loss: 8.23e-04, Avg Return: 0.451, Regret: 0.3511, Entropy: 0.0619 +[2026-01-29T22:38:35.097129Z] Loop 3720: Loss: 6.30e-04, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.0581 +[2026-01-29T22:38:36.258784Z] Loop 3721: Loss: 7.21e-04, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0548 +[2026-01-29T22:38:37.420436Z] Loop 3722: Loss: 9.91e-04, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0632 +[2026-01-29T22:38:38.581609Z] Loop 3723: Loss: 1.40e-03, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0668 +[2026-01-29T22:38:39.742785Z] Loop 3724: Loss: 1.53e-03, Avg Return: 0.454, Regret: 0.3510, Entropy: 0.0641 +[2026-01-29T22:38:40.903291Z] Loop 3725: Loss: 1.13e-03, Avg Return: 0.454, Regret: 0.3510, Entropy: 0.0611 +[2026-01-29T22:38:42.064838Z] Loop 3726: Loss: 9.25e-04, Avg Return: 0.450, Regret: 0.3510, Entropy: 0.0623 +[2026-01-29T22:38:43.226398Z] Loop 3727: Loss: 9.44e-04, Avg Return: 0.451, Regret: 0.3510, Entropy: 0.0644 +[2026-01-29T22:38:44.387204Z] Loop 3728: Loss: 7.54e-04, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.0660 +[2026-01-29T22:38:45.548909Z] Loop 3729: Loss: 9.75e-04, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0614 +[2026-01-29T22:38:46.759333Z] Loop 3730: Loss: 7.42e-04, Avg Return: 0.452, Regret: 0.3517, Entropy: 0.0595 +[2026-01-29T22:38:47.923392Z] Loop 3731: Loss: 6.44e-04, Avg Return: 0.446, Regret: 0.3517, Entropy: 0.0569 +[2026-01-29T22:38:49.085012Z] Loop 3732: Loss: 5.69e-04, Avg Return: 0.441, Regret: 0.3517, Entropy: 0.0575 +[2026-01-29T22:38:50.247400Z] Loop 3733: Loss: 6.78e-04, Avg Return: 0.451, Regret: 0.3517, Entropy: 0.0513 +[2026-01-29T22:38:51.408075Z] Loop 3734: Loss: 3.98e-04, Avg Return: 0.453, Regret: 0.3517, Entropy: 0.0517 +[2026-01-29T22:38:52.571313Z] Loop 3735: Loss: 3.41e-04, Avg Return: 0.454, Regret: 0.3517, Entropy: 0.0485 +[2026-01-29T22:38:53.734029Z] Loop 3736: Loss: 5.43e-04, Avg Return: 0.452, Regret: 0.3517, Entropy: 0.0519 +[2026-01-29T22:38:54.895159Z] Loop 3737: Loss: 5.51e-04, Avg Return: 0.452, Regret: 0.3517, Entropy: 0.0540 +[2026-01-29T22:38:56.057022Z] Loop 3738: Loss: 5.29e-04, Avg Return: 0.455, Regret: 0.3517, Entropy: 0.0484 +[2026-01-29T22:38:57.218228Z] Loop 3739: Loss: 6.67e-04, Avg Return: 0.456, Regret: 0.3517, Entropy: 0.0488 +[2026-01-29T22:38:58.430544Z] Loop 3740: Loss: 8.41e-04, Avg Return: 0.446, Regret: 0.3526, Entropy: 0.0501 +[2026-01-29T22:38:59.592358Z] Loop 3741: Loss: 1.19e-03, Avg Return: 0.450, Regret: 0.3526, Entropy: 0.0548 +[2026-01-29T22:39:00.754460Z] Loop 3742: Loss: 1.10e-03, Avg Return: 0.449, Regret: 0.3526, Entropy: 0.0541 +[2026-01-29T22:39:01.916664Z] Loop 3743: Loss: 1.16e-03, Avg Return: 0.448, Regret: 0.3526, Entropy: 0.0524 +[2026-01-29T22:39:03.078176Z] Loop 3744: Loss: 1.06e-03, Avg Return: 0.452, Regret: 0.3526, Entropy: 0.0552 +[2026-01-29T22:39:04.240657Z] Loop 3745: Loss: 7.13e-04, Avg Return: 0.455, Regret: 0.3526, Entropy: 0.0491 +[2026-01-29T22:39:05.401501Z] Loop 3746: Loss: 6.06e-04, Avg Return: 0.452, Regret: 0.3526, Entropy: 0.0494 +[2026-01-29T22:39:06.563430Z] Loop 3747: Loss: 4.39e-04, Avg Return: 0.450, Regret: 0.3526, Entropy: 0.0511 +[2026-01-29T22:39:07.726042Z] Loop 3748: Loss: 4.71e-04, Avg Return: 0.454, Regret: 0.3526, Entropy: 0.0517 +[2026-01-29T22:39:08.887388Z] Loop 3749: Loss: 5.46e-04, Avg Return: 0.455, Regret: 0.3526, Entropy: 0.0542 +[2026-01-29T22:39:10.094279Z] Loop 3750: Loss: 5.26e-04, Avg Return: 0.448, Regret: 0.3510, Entropy: 0.0552 +[2026-01-29T22:39:11.255426Z] Loop 3751: Loss: 6.42e-04, Avg Return: 0.456, Regret: 0.3510, Entropy: 0.0536 +[2026-01-29T22:39:12.417464Z] Loop 3752: Loss: 6.92e-04, Avg Return: 0.449, Regret: 0.3510, Entropy: 0.0615 +[2026-01-29T22:39:13.577753Z] Loop 3753: Loss: 8.52e-04, Avg Return: 0.450, Regret: 0.3510, Entropy: 0.0619 +[2026-01-29T22:39:14.739597Z] Loop 3754: Loss: 7.27e-04, Avg Return: 0.457, Regret: 0.3510, Entropy: 0.0595 +[2026-01-29T22:39:15.900448Z] Loop 3755: Loss: 6.98e-04, Avg Return: 0.447, Regret: 0.3510, Entropy: 0.0585 +[2026-01-29T22:39:17.062561Z] Loop 3756: Loss: 8.26e-04, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.0579 +[2026-01-29T22:39:18.224055Z] Loop 3757: Loss: 7.93e-04, Avg Return: 0.453, Regret: 0.3510, Entropy: 0.0619 +[2026-01-29T22:39:19.386156Z] Loop 3758: Loss: 7.46e-04, Avg Return: 0.452, Regret: 0.3510, Entropy: 0.0644 +[2026-01-29T22:39:20.548093Z] Loop 3759: Loss: 8.61e-04, Avg Return: 0.449, Regret: 0.3510, Entropy: 0.0670 +[2026-01-29T22:39:21.753012Z] Loop 3760: Loss: 8.69e-04, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0625 +[2026-01-29T22:39:22.917243Z] Loop 3761: Loss: 9.99e-04, Avg Return: 0.454, Regret: 0.3507, Entropy: 0.0666 +[2026-01-29T22:39:24.080079Z] Loop 3762: Loss: 9.05e-04, Avg Return: 0.455, Regret: 0.3507, Entropy: 0.0705 +[2026-01-29T22:39:25.245145Z] Loop 3763: Loss: 1.02e-03, Avg Return: 0.453, Regret: 0.3507, Entropy: 0.0610 +[2026-01-29T22:39:26.407862Z] Loop 3764: Loss: 1.04e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0642 +[2026-01-29T22:39:27.567809Z] Loop 3765: Loss: 1.15e-03, Avg Return: 0.451, Regret: 0.3507, Entropy: 0.0628 +[2026-01-29T22:39:28.729669Z] Loop 3766: Loss: 1.06e-03, Avg Return: 0.452, Regret: 0.3507, Entropy: 0.0669 +[2026-01-29T22:39:29.890204Z] Loop 3767: Loss: 1.20e-03, Avg Return: 0.449, Regret: 0.3507, Entropy: 0.0694 +[2026-01-29T22:39:31.050732Z] Loop 3768: Loss: 1.23e-03, Avg Return: 0.448, Regret: 0.3507, Entropy: 0.0696