diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_0.pth b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_0.pth index 3051249a8f1f6854c494ffaa9ec659d769df95f9..e836937f6531b27630e5e0e51a0fca32d00aff7a 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_0.pth +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_0.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3bdcf18ad102834bbc193caa9d5ef2599d196518c5cf62c3cb1cdfc481db8199 -size 15109 +oid sha256:ca044fdbd88be2c9695b0bfc45c7f89110cc955c9ea8bc691eca46f0e960a3a3 +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_1.pth b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_1.pth index 30051f1039c04b1e0faf1c8e3983ddd497505aea..c56bb5ac3637b9e3eb6a2071abbde9bd42ee4612 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_1.pth +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_1.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4585cd50d10b6184d4c05fabcb0a520efcaf963122c89f8e9bca60e29bcee15b -size 15173 +oid sha256:81d5542746ab29db50a33ed3efd9b52249333eecd7db370cba4b8f50889f2495 +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_2.pth b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_2.pth index 552935e458d9155abdb6e2073ae7c1af9a7918a5..c6806a305b7f836bfd257a16e14b1fd274667020 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_2.pth +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/rng_state_2.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6faf1ffaa3db03ec15a7c6986f128dc2d3b3762ae5fba2e1acfe2a5d1ed94950 -size 15173 +oid sha256:aa26f1d0701a44bf8fd1e3f7afd1a9bf84613a2bf289ea75779a07bce9ef20d3 +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/scheduler.pt b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/scheduler.pt index c447eb13fb9579aab49dd7315069854f0348e0f1..7405e2e997efbd406ab6ccf0e122963d291248cc 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/scheduler.pt +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8683558bdfece813732a2dfa15cb1742de3b6ec89e63eaa45bde5b05053398f3 -size 1465 +oid sha256:02722db95670c95c8ae55426ac5ca695f542906a64db2f5040a0cf2223d465b4 +size 129 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/tokenizer.json b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/tokenizer.json index 51ebb3ba93988c73bbd83a3c163a14343fbc5b06..2e1a0e3729e4c303cc9ab0f5935a0af9a6b906a9 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/tokenizer.json +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/tokenizer.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa -size 11421896 +oid sha256:cedf8734fa1adb8c4ce97738255bb9ae9a474dcc57a219a61df59d32cee881c9 +size 133 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/training_args.bin b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/training_args.bin index c5bee36fe9f24440ffdbc258d61bc2bb8c7e107d..4f0472d82b56097d6ad0979f839d6e21d0c83bb8 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/training_args.bin +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1600/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0aace0e8f51b04b975b33612b86638b384e370113214b2b395f4fe13bec720c7 -size 11921 +oid sha256:3914d42b3a481d0170feb4803e516c76845d6d989117596e7b25e609a52bdc89 +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00001-of-00004.safetensors b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00001-of-00004.safetensors index 512d24b7af132834ff429fe7a4e9af37937972c9..2dfa49b99c5407b9022bcc052bf819c5122c0778 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00001-of-00004.safetensors +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00001-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fe2111725093259bf7db13b697955e7ad9a98a1cc8a7487c7ba12947aa271e58 -size 4968243304 +oid sha256:0d55ca504fc921aa22682048b6f3423764947df1b801c0c0c00c68113ae6d820 +size 135 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00002-of-00004.safetensors b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00002-of-00004.safetensors index 149b630cfb260afb0715f4671a895775b85bfb61..6c7c2c264074e85f70e043f09ee6afb7abc7b2eb 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00002-of-00004.safetensors +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00002-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5d86b2784e2d2a5cce2923752aef01a2ef0c39618c5365fbc0677bee7ff2864d -size 4991495816 +oid sha256:ea79d0afd3c19f80814076fcf6278252944ae71d123f0977461964c244441daf +size 135 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00003-of-00004.safetensors b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00003-of-00004.safetensors index d21eccfc5e56367c6cb07e8664f5d57c28e90a4a..b43471f1bf4a994ded4c43d368c7b6ee27cfc651 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00003-of-00004.safetensors +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00003-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:825fb80ffc0739940e5d91587090502570267b8787871a5ab0d98ecf112fa0bf -size 4932751040 +oid sha256:e983abff204a4ab9280f062713af65f4749995e040e9d02a3f08e94f14c7fd1f +size 135 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00004-of-00004.safetensors b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00004-of-00004.safetensors index 0590b59e62cc3a833c5518fa8538121a80c656e8..12d8ee29f648d66c8d00025ed84ae16eae8396e2 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00004-of-00004.safetensors +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/model-00004-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8b1c07b1a93be2e5b72f4f32463c15021bed0f5f86727073a55046910227fbb6 -size 1691924384 +oid sha256:7178942ef34842e5cb365607d3f4f964fe290ad3fb1970b33db64070e33ab6cf +size 135 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_0.pth b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_0.pth index aaa86fe1dd01f5f96fc29ed542eed7bf64843f88..0abf45f85f3bdb4ca6f4d092a7d17010250706b7 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_0.pth +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_0.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e1627d80330ab147eb89b6ed0f23182a972d2727e5f0d3fae96c084255d52270 -size 15109 +oid sha256:9126fd67f78bb36e497dd1ffd1c188496ee5c850febb75dc4848e770326bf734 +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_1.pth b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_1.pth index 4a79194b4bfc8bfdb082acd3e899b7e7afb8e366..1fe20c345a0e88ffb7e412f2fcc8138732e81e33 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_1.pth +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_1.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:797cd9e6725f0499f0f171f562bb2d8b4536a9abdd6be173420e5d27a526afb8 -size 15173 +oid sha256:9fba81a096ebd3ab8e73ef2baedcbe4c3fc2b6a3d4cb96217807137d883d6ee1 +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_2.pth b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_2.pth index df266b7ea89ccc67006f15596e3bbc5d29140eea..b759fbb088e6d5b5e78da32577a678798b092750 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_2.pth +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/rng_state_2.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:866dc7e3f46c90cecce31a03f4d4c2460afadaf13bf4d7f23240798a9932c73c -size 15173 +oid sha256:e544572d82996a771d77b4013bd8f8a1f0f59d9e3d10dfb34e806dc69f0d8eb4 +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/scheduler.pt b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/scheduler.pt index c0e355b4520c5b287c64a889563396a7ab01ac61..502efc9b9770fa728c9115d9f8e1111e7d6674c5 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/scheduler.pt +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ae08b0218f323514008a7084502fb613a4d8b378e0b2bc3cf9c36567e1ee6c30 -size 1465 +oid sha256:ef0787a9311031a3e1649d17328b5f6c51f60a60a8e455829d452a2aa83ad683 +size 129 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/tokenizer.json b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/tokenizer.json index 51ebb3ba93988c73bbd83a3c163a14343fbc5b06..2e1a0e3729e4c303cc9ab0f5935a0af9a6b906a9 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/tokenizer.json +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/tokenizer.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa -size 11421896 +oid sha256:cedf8734fa1adb8c4ce97738255bb9ae9a474dcc57a219a61df59d32cee881c9 +size 133 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/training_args.bin b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/training_args.bin index c5bee36fe9f24440ffdbc258d61bc2bb8c7e107d..4f0472d82b56097d6ad0979f839d6e21d0c83bb8 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/training_args.bin +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-1800/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0aace0e8f51b04b975b33612b86638b384e370113214b2b395f4fe13bec720c7 -size 11921 +oid sha256:3914d42b3a481d0170feb4803e516c76845d6d989117596e7b25e609a52bdc89 +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00001-of-00004.safetensors b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00001-of-00004.safetensors index 257f0eb08648e0ebbd99d9d6806dafaf3fc08fa0..29e619c27a4a6615a75d55925c6aca6058a9b8ee 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00001-of-00004.safetensors +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00001-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:694eeb561d5c0fcd666733d5f3a993582395c78e70513443f424904d00044309 -size 4968243304 +oid sha256:90cbe3f9bf67e76ed9a87d782e0273c82bcd2f92e5b1f431eac6e7530bf4d777 +size 135 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00002-of-00004.safetensors b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00002-of-00004.safetensors index 2ec58dc75930a4738f4ffa69937d3f9e8295d4da..d272968241f2bed2c6cd2d3b1f84b6e352f0cb2c 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00002-of-00004.safetensors +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00002-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:33891345d42f9eb9f2081dc1108ca475c90ca8be4bc84de989ab6a852cf451e8 -size 4991495816 +oid sha256:c5c46b2b504233fbf77a547848af0e0968f227a75d4941a4de0df6dd41a6123b +size 135 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00003-of-00004.safetensors b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00003-of-00004.safetensors index 24e5045bbfa7ffa63e8bc76cbba15a99c16ac42a..13f19533d2023a3a9f3ef10e6e7373c089f7153c 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00003-of-00004.safetensors +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00003-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6b5eb55e3427337b13cb390caa6a4a5d80e4126468611b41aef27f3441d314d0 -size 4932751040 +oid sha256:f90c68af19df92f01755d413ba6a86f03a4bdd836e6d48ba2623bef3a0983712 +size 135 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00004-of-00004.safetensors b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00004-of-00004.safetensors index 1e53dfc59f85c6f583d81890d6350cab7282d025..04aef2a260279e94e8665edf74791878ae16723f 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00004-of-00004.safetensors +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/model-00004-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9e0eedce4a86e0b70488b175bf5d6504af57ee66b1865f87c5c9cc4169e7fc43 -size 1691924384 +oid sha256:2b5b0a7e224cd294f0a4fecbf00653daedf3955c77299858c47efcd19678ad6f +size 135 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_0.pth b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_0.pth index e3bd3b710f87c64db4be127b551a2fda1c148f2d..0807e921478ade933cc9039d758aca194864ac79 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_0.pth +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_0.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fe4b9c0e955393f546b8b7012c4ffb45564fcdd2abedd0558a6ed60c05d7ee6a -size 15109 +oid sha256:ad06037cab1bfd2b5884de38639011af318199d3d7e3e01e5d0bc2c587d6ddde +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_1.pth b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_1.pth index a40fb4bcd614e3ca7dc7f5b2b284027c31b5008e..2d01b07861f731d4db9b772f96ed277a500dfdfc 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_1.pth +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_1.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3f89e5ec9f73cd0c0b4adea72b241b4fc86a6585f1665b486ee60b6499a9b156 -size 15173 +oid sha256:5cc6b767a7a6bff7b398dc16e6d641ca7bbd31433c52de33fecb829fa7880d49 +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_2.pth b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_2.pth index abb465e10a88a03b2693feb572ee822663e4793d..854503c404bc3f918a1b5abbb22037940dfcd026 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_2.pth +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/rng_state_2.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:72019cbfa9da9f357a35599a229a8aaafcae868fc98649adb384c4e7cce4441c -size 15173 +oid sha256:bdb765c4702930159c0ea552b113264f474874cad23a5f5fb11acf9ef287dd69 +size 130 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/scheduler.pt b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/scheduler.pt index 5a80f57875dcf0d237e105a2548bfbc3021ee65e..0fc6ee755fdb3375fb2310335a63f86e439c1ae7 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/scheduler.pt +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bd2452db79482eba734decf705de64b633787c31f8b16577195e652e1472cba2 -size 1465 +oid sha256:34219817cb7a4d1e18d5d6051c513959385bea64f63b421d6eff4eec75d31480 +size 129 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/tokenizer.json b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/tokenizer.json index 51ebb3ba93988c73bbd83a3c163a14343fbc5b06..2e1a0e3729e4c303cc9ab0f5935a0af9a6b906a9 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/tokenizer.json +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/tokenizer.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa -size 11421896 +oid sha256:cedf8734fa1adb8c4ce97738255bb9ae9a474dcc57a219a61df59d32cee881c9 +size 133 diff --git a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/training_args.bin b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/training_args.bin index c5bee36fe9f24440ffdbc258d61bc2bb8c7e107d..4f0472d82b56097d6ad0979f839d6e21d0c83bb8 100644 --- a/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/training_args.bin +++ b/qwen2.5vl-7b-thinking_v2_full_comet_grpo_continue_e8/checkpoint-2000/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0aace0e8f51b04b975b33612b86638b384e370113214b2b395f4fe13bec720c7 -size 11921 +oid sha256:3914d42b3a481d0170feb4803e516c76845d6d989117596e7b25e609a52bdc89 +size 130 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00001-of-00004.safetensors b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00001-of-00004.safetensors index 4c8fc1d7e816f6099c8f463400583925e760dd97..81c911065992e08ff85574c6180077ba1b5dfdd8 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00001-of-00004.safetensors +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00001-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3fe6cad6f644dcc48b99ddbddcbf099d3430b4a777552d51ea09168b27af6923 -size 4968243304 +oid sha256:7b65547f1ebd2de2bc10a6df51fa81257581b6a9693339e3181fe0e6741d8762 +size 135 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00002-of-00004.safetensors b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00002-of-00004.safetensors index 930545b1cfeb184c32b5911d9e7ddf29537d2c4c..ac908849e42465d998be9fa16fbbd9f3e465c360 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00002-of-00004.safetensors +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00002-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2ce8259630edf2c4b8ab3f6d3d7bc973e40342be7ce919c746452b63d2d3ae3b -size 4991495816 +oid sha256:a9a68cb07097f9a9de56e2c2403e105ada6385b27a9f5e93d6e24a7bd6c933ee +size 135 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00003-of-00004.safetensors b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00003-of-00004.safetensors index 9033bd775f68872b019381652c93fcb0f3f586fc..600574765495ba038fdd170d0587dca7e2286932 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00003-of-00004.safetensors +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00003-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f2652201fb1f71619629583413948a0a182a654d43ab7bdc10068c14cb16fe58 -size 4932751040 +oid sha256:dbc472bd49f91ae5d66148b64ffd5794fe09970506bc3f278a75c1cff0f3bcb5 +size 135 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00004-of-00004.safetensors b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00004-of-00004.safetensors index ad5bf505160827a81f124271209a5f68989768ff..46ffc88cc20fd67699275390f027ab2eeb0c440d 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00004-of-00004.safetensors +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/model-00004-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0191f8d1be7db5111888c383b9ff46248f88c100c7ff998f27d5eb622e233fb9 -size 1691924384 +oid sha256:9b7e8e8370bb5f601804a033a81d4a00d86a1b56badfd6ee944512b20b811788 +size 135 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_0.pth b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_0.pth index e46fa0dc07ae2a7dce5f7bdcc9344699c10b2535..81244c95cef059c3ef7a07e4c0afbfa966866a6b 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_0.pth +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_0.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:11d4ec11f6f0c4379a450e016e2475ddcdb9f98c890cea685430f774510e454c -size 15365 +oid sha256:ab596e0074fe8fee5443d1dc388174e5b4ad6a05ba78af96806574c6bb4a2e84 +size 130 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_1.pth b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_1.pth index 601cf9dd1bf6339324ff9c9a783f97cd2333b2a3..70a8f9c01a9da74b86e8c0fa06f03774dd63222e 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_1.pth +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_1.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:15ea0f5e1c543bb6e7297ddedb0c2b9f30373216d289e72c7be8799b46ac0a9e -size 15365 +oid sha256:90957bfca8ef78cb551e5453d61f48d0b114ab396c7d346d33151cdf5017ef40 +size 130 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_2.pth b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_2.pth index bc49f23d63ae85b622e6f33efc0a98d159bbe3c4..1513bc331710d23540ef08f7ec08c0e3369be05c 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_2.pth +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_2.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8d8b328f7d4f2bb6648f1f263cde446be2b7d71b86a2fe59e904e9c80bd58c4d -size 15365 +oid sha256:94639ba187fc7fd1451c59ed5b092f649f27e59ef67e18667b9fcf4dc089924d +size 130 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_3.pth b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_3.pth index 4c86b6053a34ad945109eb61ec25ce4ee5098321..500eab6ecee61f1c2be72d94c3afe4e4b3aebaa4 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_3.pth +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/rng_state_3.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:449e8d845f7cbbc2f810921abc3f37f01338b84751e2dcde9f14a53ca2fc564b -size 15365 +oid sha256:30f922eea6a11d13452a1305f44f07ba18561e1e7922267b132ba5ac44460daf +size 130 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/scheduler.pt b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/scheduler.pt index 299a61ebb90480c491375c71f98658e6f96f23f6..cc4a2add79d33bc858a254b25e45d3a9b1e8c211 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/scheduler.pt +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e992dd0fee4e3c06035652b6a642918796d13de583f52aec0ec1a30e35cd2c22 -size 1465 +oid sha256:cdfc4356323d70a975b17c2c0666f5b2f6b6db103ff55d46802eba2ec15cf289 +size 129 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/tokenizer.json b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/tokenizer.json index 51ebb3ba93988c73bbd83a3c163a14343fbc5b06..2e1a0e3729e4c303cc9ab0f5935a0af9a6b906a9 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/tokenizer.json +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/tokenizer.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa -size 11421896 +oid sha256:cedf8734fa1adb8c4ce97738255bb9ae9a474dcc57a219a61df59d32cee881c9 +size 133 diff --git a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/training_args.bin b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/training_args.bin index 7790b7e56d31d5a550a2f208960629d60dcd5d28..9ae5f912fa2a3b55233591abbaea46599662fe32 100644 --- a/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/training_args.bin +++ b/selective_loss/q7b-thinking_full_v2-spwr_lr2e-6_wd1e-4_a05/v0-20250823-204148/checkpoint-280/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c12dcc851c6dba6fb08092507182e20bcfc1c15070a953c577e90ce3e7bb81ed -size 8913 +oid sha256:0f87cfe96c2d2da814ff4dcfdcbbda35d8b8a777a4b6e3d40e6945a8817e5a81 +size 129 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00001-of-00004.safetensors b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00001-of-00004.safetensors index 71a6371688de652ea1f144bae10bc02911e9552d..cad389becb99a4dd68e78e1d03f91ccaf8c69115 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00001-of-00004.safetensors +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00001-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:17706758f7c7cb1f2c80df77eeabd396598cc6cf292f4b774ec656f77de7c01e -size 4968243304 +oid sha256:06f542553098ca10b8b11ca140c54a4ba8a4afb6ca08f81651d7765343ab28c3 +size 135 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00002-of-00004.safetensors b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00002-of-00004.safetensors index 2970f08e40b0f3af872f6e3ec1e3c9399e4400b2..b23612f018c40d7822ba23cd6f3268596f090093 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00002-of-00004.safetensors +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00002-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:167976f6a503c767525ae6afb6444641b35a7e2280d6c4bb8fd1c44df20c96c7 -size 4991495816 +oid sha256:8cfd561073b4466168838f29e6ddf9b1014421a81dde330a098393e0b9d4e2b8 +size 135 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00003-of-00004.safetensors b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00003-of-00004.safetensors index 98fe73e66f97a64db6e342b104f3ef4f7e338d29..bcc76f801dc1f0337f670e5d477e2612c3c691c6 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00003-of-00004.safetensors +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00003-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5be58bbd7ea1fdef3d583c1e41b6cf2bdf5aa51f12e4d14e86ea4a1ffb17493c -size 4932751040 +oid sha256:92fd75303812bb1d8da1d9ad4cc446fa27f4eba63f9f3c4bcc1cb0d50e4cc2fb +size 135 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00004-of-00004.safetensors b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00004-of-00004.safetensors index 3ad32a883722b05647218b9f698953a4e588d468..84e839dfc65af1e11360adcbf275331b75fb675d 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00004-of-00004.safetensors +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/model-00004-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c5dca6149611e53c0a679bc4e22b9b2bb1246837d1b0062feb6347536732d261 -size 1691924384 +oid sha256:b33377b7eda788192e74c628df7de71db3c1a9cb7561b5f75312c359cbedf2b1 +size 135 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_0.pth b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_0.pth index e46fa0dc07ae2a7dce5f7bdcc9344699c10b2535..81244c95cef059c3ef7a07e4c0afbfa966866a6b 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_0.pth +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_0.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:11d4ec11f6f0c4379a450e016e2475ddcdb9f98c890cea685430f774510e454c -size 15365 +oid sha256:ab596e0074fe8fee5443d1dc388174e5b4ad6a05ba78af96806574c6bb4a2e84 +size 130 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_1.pth b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_1.pth index 601cf9dd1bf6339324ff9c9a783f97cd2333b2a3..70a8f9c01a9da74b86e8c0fa06f03774dd63222e 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_1.pth +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_1.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:15ea0f5e1c543bb6e7297ddedb0c2b9f30373216d289e72c7be8799b46ac0a9e -size 15365 +oid sha256:90957bfca8ef78cb551e5453d61f48d0b114ab396c7d346d33151cdf5017ef40 +size 130 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_2.pth b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_2.pth index bc49f23d63ae85b622e6f33efc0a98d159bbe3c4..1513bc331710d23540ef08f7ec08c0e3369be05c 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_2.pth +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_2.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8d8b328f7d4f2bb6648f1f263cde446be2b7d71b86a2fe59e904e9c80bd58c4d -size 15365 +oid sha256:94639ba187fc7fd1451c59ed5b092f649f27e59ef67e18667b9fcf4dc089924d +size 130 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_3.pth b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_3.pth index 4c86b6053a34ad945109eb61ec25ce4ee5098321..500eab6ecee61f1c2be72d94c3afe4e4b3aebaa4 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_3.pth +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/rng_state_3.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:449e8d845f7cbbc2f810921abc3f37f01338b84751e2dcde9f14a53ca2fc564b -size 15365 +oid sha256:30f922eea6a11d13452a1305f44f07ba18561e1e7922267b132ba5ac44460daf +size 130 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/scheduler.pt b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/scheduler.pt index 6fbfcffac232af47e44c2216441c9709b3b0f525..b0699865e423f5b6466e02b4ddeb5698386211a0 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/scheduler.pt +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ded1c312c0e169d37c17d82545a7b599a226f1381cc3d6a0a3500e997da33658 -size 1465 +oid sha256:f3bcc3c3d0cfbdf4fd8be460f9fd21e6c8cce075b79a0097c9b8dfd0ce5609e5 +size 129 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/tokenizer.json b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/tokenizer.json index 51ebb3ba93988c73bbd83a3c163a14343fbc5b06..2e1a0e3729e4c303cc9ab0f5935a0af9a6b906a9 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/tokenizer.json +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/tokenizer.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa -size 11421896 +oid sha256:cedf8734fa1adb8c4ce97738255bb9ae9a474dcc57a219a61df59d32cee881c9 +size 133 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/training_args.bin b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/training_args.bin index 11f5f5ce925a6cb424d48157b48e1390579c29a6..4f4e760fd2a899a262849ab78e1cac535f28ba32 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/training_args.bin +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr1e-6_wd1e-3/v0-20250818-120403/checkpoint-280/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8deca80007589896177b99c4708d5623c0515e925b518deddbbea74b7e6394fe -size 8977 +oid sha256:16f72f1b618b0050138182932a053d99c3cee17f630978a203aedc7ae12dd11d +size 129 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00001-of-00004.safetensors b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00001-of-00004.safetensors index 56bc642afe5a1cd5c4b021cb0b7145bcff017cc8..c856041ce10fb3d44fb4d2f47f6964a84459e46f 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00001-of-00004.safetensors +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00001-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8ba52632de46207532bcfbb2a7410c0abc7e09bb218bad4d41ea5c8ddf8eb7d0 -size 4968243304 +oid sha256:9def51748090bdcdd44f2ee8c0f50d76ac11e5a5fe2b204bf567cf97831f8a5c +size 135 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00002-of-00004.safetensors b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00002-of-00004.safetensors index d3e57152977cd68691ac041ca988a1a0cda5e53e..5598e4716e1516585bba62d4ad9ce8c8dbfa0703 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00002-of-00004.safetensors +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00002-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:62683729b4392e03077ef7a9cf1f87ede86f7f53e6446a5a977464e11d9bc2ef -size 4991495816 +oid sha256:360a6a8cc6cf615136a7fe93f5260cd0398b391d6e2f2e141db55d4b8d640d1d +size 135 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00003-of-00004.safetensors b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00003-of-00004.safetensors index cd8f343c5a6acb3dcbed4e76a767d7c93a9b0168..257c3f428d604b9795add529aa9a89d14ff7859a 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00003-of-00004.safetensors +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00003-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cd5600af79a897971f0543e958f12b95a59f06b840cffb777984979a807399f9 -size 4932751040 +oid sha256:67163f2b95c4e8ffa32294c4bf3568a2240c048f4e4d54f4838e768b0fbb34bc +size 135 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00004-of-00004.safetensors b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00004-of-00004.safetensors index a4f9058a249cdb8a0b56de8c5e478b689792e0bb..b5e7a84481133d6f990b6fc4e7ec55fccddacd94 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00004-of-00004.safetensors +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/model-00004-of-00004.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:171c19c630e25ee1668449d8869778646a9e7d97ba104f49dddd7b5ef706ba25 -size 1691924384 +oid sha256:fec8abff3f8c92cde60623c42f22366948f2e7fe2fb23ddfd56aab827bdaac93 +size 135 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_0.pth b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_0.pth index e46fa0dc07ae2a7dce5f7bdcc9344699c10b2535..81244c95cef059c3ef7a07e4c0afbfa966866a6b 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_0.pth +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_0.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:11d4ec11f6f0c4379a450e016e2475ddcdb9f98c890cea685430f774510e454c -size 15365 +oid sha256:ab596e0074fe8fee5443d1dc388174e5b4ad6a05ba78af96806574c6bb4a2e84 +size 130 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_1.pth b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_1.pth index 601cf9dd1bf6339324ff9c9a783f97cd2333b2a3..70a8f9c01a9da74b86e8c0fa06f03774dd63222e 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_1.pth +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_1.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:15ea0f5e1c543bb6e7297ddedb0c2b9f30373216d289e72c7be8799b46ac0a9e -size 15365 +oid sha256:90957bfca8ef78cb551e5453d61f48d0b114ab396c7d346d33151cdf5017ef40 +size 130 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_2.pth b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_2.pth index bc49f23d63ae85b622e6f33efc0a98d159bbe3c4..1513bc331710d23540ef08f7ec08c0e3369be05c 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_2.pth +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_2.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8d8b328f7d4f2bb6648f1f263cde446be2b7d71b86a2fe59e904e9c80bd58c4d -size 15365 +oid sha256:94639ba187fc7fd1451c59ed5b092f649f27e59ef67e18667b9fcf4dc089924d +size 130 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_3.pth b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_3.pth index 4c86b6053a34ad945109eb61ec25ce4ee5098321..500eab6ecee61f1c2be72d94c3afe4e4b3aebaa4 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_3.pth +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/rng_state_3.pth @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:449e8d845f7cbbc2f810921abc3f37f01338b84751e2dcde9f14a53ca2fc564b -size 15365 +oid sha256:30f922eea6a11d13452a1305f44f07ba18561e1e7922267b132ba5ac44460daf +size 130 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/scheduler.pt b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/scheduler.pt index 299a61ebb90480c491375c71f98658e6f96f23f6..cc4a2add79d33bc858a254b25e45d3a9b1e8c211 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/scheduler.pt +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e992dd0fee4e3c06035652b6a642918796d13de583f52aec0ec1a30e35cd2c22 -size 1465 +oid sha256:cdfc4356323d70a975b17c2c0666f5b2f6b6db103ff55d46802eba2ec15cf289 +size 129 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/tokenizer.json b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/tokenizer.json index 51ebb3ba93988c73bbd83a3c163a14343fbc5b06..2e1a0e3729e4c303cc9ab0f5935a0af9a6b906a9 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/tokenizer.json +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/tokenizer.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa -size 11421896 +oid sha256:cedf8734fa1adb8c4ce97738255bb9ae9a474dcc57a219a61df59d32cee881c9 +size 133 diff --git a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/training_args.bin b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/training_args.bin index 6abe8e2207680b11fd1c919264cb7f48f675045d..e6058a79e711895b780f5244bfa284bc9c729bce 100644 --- a/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/training_args.bin +++ b/selective_loss/qwen2.5vl-7b-thinking_full_v2-spwr_lr2e-6_wd1e-4/v1-20250818-111947/checkpoint-280/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1d038e3e209f79fe63458c3eecd194e4dd3cc7d9df8ffbf96195b0fa73bf53c3 -size 8977 +oid sha256:998e1e09a84fd0e640b9986ec1b9d5e8bc131d6bf77473f813053d9e80995c03 +size 129