diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..0665dd7cda7bba286a01f139636b205a4294a056 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 953.0 0.0 953.0 953.0 652.83594 0.0 652.83594 652.83594 -0.002168625 0.045007654 0.059986245 -0.07406212 0.33057702 2.4347472190856934 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f59a87e6abe089f20e2e1d543d04c202f849672 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:078ce9e6cec48a03210cd96bbdfafdfaaf9a911c7a156af1ec376a4a0850b3ce +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fdc912226bd0edd1bd3def939fc02fdb9cd183d --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 1376.0 0.0 1376.0 1376.0 1095.3876 0.0 1095.3876 1095.3876 0.0021131376 0.045713313 0.05986391 -0.074177615 0.3324795 1.2189209461212158 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..33bba8a7e00960901dfcd530598305624f303b76 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd69b46ea9ea2ae5a0f3f070e9cac631c78b2a3fae1a3be584a211a4f729b4f +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..0df84992ccbacbfe25f1404b71db25fc00756fdc --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 1604.0 0.0 1604.0 1604.0 1277.858 0.0 1277.858 1277.858 -0.007816804 0.04234601 0.04392085 -0.07385238 0.32712317 1.3374824523925781 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc30dbc94a29543e792bc6333d319858d68a348f --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc4e78f36d34a76e929ff642de1a30e4cabf43ad7db5584b3f7fe370fac5626c +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..bde01934d14f755a29289761cdb12a80734eec1c --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 2580.0 0.0 2580.0 2580.0 2303.1753 0.0 2303.1753 2303.1753 0.00021175982 0.044766117 0.06119552 -0.07291788 0.31173953 1.2636334896087646 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..09c4c375b1f9414f040ebcf43d12ee7526353f27 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:496d97394e097575b6e037199f6cfb8ba91408a063dff727be0ec56775229ed4 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=12_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..1440802339c184ee08065fec358fd7385c4fa1cd --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 -19.5 0.0 -19.5 -19.5 -295.18323 0.0 -295.18323 -295.18323 0.004156622 0.04656521 0.05951858 -0.074503504 0.3378471 1.1905972957611084 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f84e422332e77639882de5e2eaaeab30e458dc --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ebd032ec441a06f6968ca2b16b51682cd6e79833aa1efdec1cf38c19e364842 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..133d068b48f976dbc2c9954f6937c21c5a02ce02 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 39.0 0.0 39.0 39.0 -238.53288 0.0 -238.53288 -238.53288 0.0017500948 0.04590834 0.060370363 -0.07369913 0.32459962 1.2593295574188232 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0d5b5f4e401cacfe4e9d0ad007ccd0f1ab844da --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6aa19c4f4bad0ed96e8b7e614406ca263a6b40917c0fd32209306f0def6c65b +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..c0d01f903317c792eaab2e3695adfa426ea10a85 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 19.5 0.0 19.5 19.5 -201.3899 0.0 -201.3899 -201.3899 0.009826353 0.047053043 0.06222207 -0.07194317 0.29570273 1.1741359233856201 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc24d2d1d892b6945b99bfa068681ff07acb9b75 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e38b43dbb2bf642fbf4d4f3f5280e8090d7c33344afa5885fce20fb44f6578 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..01744509adf84131f31dff764c421196584522a4 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 39.0 0.0 39.0 39.0 -227.24684 0.0 -227.24684 -227.24684 -0.00016120703 0.044984415 0.061915003 -0.07223507 0.3005043 1.2381904125213623 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..9965b05fb83478b7b0f8ca2a20b9ee1e30c314e6 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0276f41badc0b9693f26de5f14bd31136ea2dd23cd6bf316eb7af475477c5ace +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=13_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..c50a8b0216e6e35864bc12fe35c1ccc070b80899 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 214.0 0.0 214.0 214.0 -55.185673 0.0 -55.185673 -55.185673 0.0041629653 0.04669452 0.060185533 -0.073873825 0.32747644 1.1202867031097412 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fb7fa9b1eb91c68d9d1eaa0badee3ef7a899541 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f504428ffdfb0cf9d1594a1b55a3e11b894b42949703ac99e2bce2f8b7c3b881 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..3946cdb28adb82fc0d0c0b350bdaf5d44749818e --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 942.0 0.0 942.0 942.0 609.8738 0.0 609.8738 609.8738 -0.0059993602 0.043736286 0.05904211 -0.07495253 0.34524554 1.22102689743042 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c5b9dddc94914cdd2520728566a722bd848e41d --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe9eb815636f624c749b5538b6dec2e1a57cb9e3f6f1f66056932ca973e41db3 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..822696dcf7ebc49aacaa9bd9d51f079647b73d9b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 214.0 0.0 214.0 214.0 -69.954895 0.0 -69.954895 -69.954895 0.00080094236 0.046026777 0.05988761 -0.07415526 0.332111 1.2477691173553467 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..093fe7a960698f64fb935ce10f0ef77c28b6c690 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d2ade6820a3cede6670c9a268475e3000e5b7fb0d97e86727b3e05447c99d0 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..664d384ef9eb7e7819f30feab71ef77d80fe643d --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 923.0 0.0 923.0 923.0 590.87384 0.0 590.87384 590.87384 -0.0059993602 0.043736286 0.05904211 -0.07495253 0.34524554 1.3280327320098877 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..106b7c22657376b6b03a41c899481f9fbf07e0e5 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a406086c664bee26218c78a53b7223c30506c5165b93c4b401142da600c681b5 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=14_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..b3d295015777902a6a109dd91266560fffeb2055 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 1848.2 0.0 1848.2 1848.2 1559.9917 0.0 1559.9917 1559.9917 -0.0035963813 0.043860883 0.06137715 -0.07274568 0.30890533 1.2274601459503174 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eaf3d9a71641a5d7ada8d5a3d6e3062c55f4eea --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c638df4a59acb30559366536fcc6285741c7b2dc3646efdc4cd87ea036fccb0c +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..0ddac538769e07141cd42ba6e6d891a0b494694b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 25202.5 0.0 25202.5 25202.5 24892.254 0.0 24892.254 24892.254 -0.004313882 0.043747842 0.060352977 -0.073715575 0.3248704 1.2146625518798828 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..db3691b22b2fe1c016a3443b73f1ed2ee8d465ff --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bc2f0486657dfe33ac12a426e29cde5f716a457eea69ca9dc4b3829f3c48b3c +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..9984fef318855f837a504fa6027fc94e2131f3a7 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 2973.0 0.0 2973.0 2973.0 2637.7659 0.0 2637.7659 2637.7659 -0.0023830372 0.045824938 0.055983238 -0.07781964 0.39254695 1.1980488300323486 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b2ed0aece8a0f32391a552dca40e5856096ee84 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c88e2db2f193ae4b3dabd26e8def3434d2c688170c461954b5c36a073a53a222 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..7c5261fdb7ba5a592357e998bdd31ff691c637ff --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 69257.15 0.0 69257.15 69257.15 68971.67 0.0 68971.67 68971.67 -2.2340218e-05 0.044770774 0.060896598 -0.07320111 0.31640127 1.1387743949890137 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc7217c2f4ca097808ccff6ea47e63fa6c71fcf5 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdf0d9ab6f67c21b98303a249852b8e82c9160dc8324058929a8d149921b862d +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=15_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf4bf180bb0e5e66fc8258614745a1625d60b860 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 469.5 0.0 469.5 469.5 171.60954 0.0 171.60954 171.60954 -0.0040375427 0.043836556 0.06109938 -0.07300901 0.3132392 1.1946899890899658 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6f14c5d4aaa8432b1cfaf9ab5b2d055e0ca9646 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26770c178b59d57b421b86be066216e9012d6524a7a5adc38ee5c6a6ca495c55 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..c079364a11b08ee1bab5a3bd1b4bbaeb692a5004 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 588.0 0.0 588.0 588.0 288.50058 0.0 288.50058 288.50058 -0.003655277 0.043775555 0.061117496 -0.07299186 0.31295666 1.225114345550537 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b7ac33440e3c725137ccd3f2da7d614c4e19c30 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46684c2ff76aeb722ecb3de6abf4ae19fa0b56f8735a182d847af49dda8a4e00 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=0_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b82203e617fcd7ec1b7ecc4bfadbe7a33c137bf --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 927.0 0.0 927.0 927.0 630.6543 0.0 630.6543 630.6543 -0.004067607 0.043875653 0.061076667 -0.07303053 0.31359354 1.1973612308502197 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..254c9ecc2deb1880a3ad3f23668b3b4624614f52 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e63f45ad9366bce2304a82dae3791513a93e870dd8e78c3b56ff26b9bbb51e +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=0_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt new file mode 100644 index 0000000000000000000000000000000000000000..19333a7a97c3386ffd96ad9ad43c26c9fd7f2603 --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/progress.txt @@ -0,0 +1,2 @@ +Epoch AverageEpActualRet StdEpActualRet MaxEpActualRet MinEpActualRet AverageEpLambAdjRet StdEpLambAdjRet MaxEpLambAdjRet MinEpLambAdjRet AverageVVals StdVVals MaxVVals MinVVals Lamb Time +0 383.4 0.0 383.4 383.4 73.148766 0.0 73.148766 73.148766 -0.004313882 0.043747842 0.060352977 -0.073715575 0.3248704 1.2039244174957275 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt new file mode 100644 index 0000000000000000000000000000000000000000..c53541a72ce162f2712b652d3185b91ffe2d321b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/pyt_save/model.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22d507741a9072d48bbce88caba49bd7219fc2c27d6ed2ca0edf0aa374bdf8b5 +size 26198 diff --git a/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54013b6d6c78aa772e01cfa85fd1268adb8ac11b --- /dev/null +++ b/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0/reward_1707748949.611114_config.reward_from=llm_task_index=16_stage=1_iteration=1_n21b7.0dcounterexamplersample_randomp0_s0/vars.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea2e1ec564527e3eda889a660916cf8391e187b0b03eca4b7d2467c96d0991 +size 13916