diff --git a/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_0.pth b/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c04ead12a24ab71cc2140a9769cc236f46e852eb --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5403a013b2bd368c8e10adb794e948e02e5156007e735e20772e548430d5475a +size 15365 diff --git a/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_1.pth b/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..24b3b938722ed28fa6adde43dcfda108beddb82e --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28b2ac11696807b7e88b2659a47dff10ad92318a9f37058ff500f219a18ee625 +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_2.pth b/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..5c28d77bb05672721a2ac6725bef0c22719da835 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8feb3027a0db03c9a827d2cd00e7d5ae9e999fcc4a8ab0ff1a99fc1f7b0b5f1e +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_3.pth b/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..14a35be582228665c16b730925a56ef52e93cb9e --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-128/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4ae7fb98b8b83fbf151b68ad0bc1352928d36cf5b489bca43cedae5ec0d0a4e +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-128/scheduler.pt b/dapo_lorafa_20251201_161746/checkpoint-128/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d08ae64295b57090bbaa5d6676253533d838873 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-128/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a72d1751ecd37a23ecd20bd8b9260f394c2f370cb5db8d203bad7d01395f4fb8 +size 1465 diff --git a/dapo_lorafa_20251201_161746/checkpoint-128/training_args.bin b/dapo_lorafa_20251201_161746/checkpoint-128/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..63c3421a8b566700bf579035beda17ca249df912 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-128/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd9fc68413aadb7b7d40e9384c483b1d5cb1998f40011e96c2faa43e1188d7d +size 8849 diff --git a/dapo_lorafa_20251201_161746/checkpoint-192/adapter_model.safetensors b/dapo_lorafa_20251201_161746/checkpoint-192/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8354bf0490232945bd5f7394a081ba63d0e2e47a --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-192/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068b118f3431e74bc82c76906c6c26ecaabbef38208a3cea1996d01893c85dbf +size 73911504 diff --git a/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_0.pth b/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..9ca79fc703760f37d8469b9e6ce9af5a1a059224 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f22615c296c292b94f7d4a2684ac471e513cd17c7e2e6acfe1029b84d0f8393 +size 15365 diff --git a/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_1.pth b/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..b31db0ab3278c77f1ccd5630d74d1ae66bae8988 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86309256de33f69cf31766561c1664c1c586a73f197b074b2fb21252f97ca43b +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_2.pth b/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..13d57f9cd69252e2219a9f68f4efc3268277e802 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2460b7a465fbad58eda8e661c6e4cd55ec7f66c3d5e12eec9a1be24ef75d18fb +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_3.pth b/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..90bb0d5d9531efadf5cc519461a6990b8489b1db --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-192/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3948ea425a5ba037c0a53e4c26a9cba635ec159214fe7a46e3e19b63a8f8f287 +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-192/scheduler.pt b/dapo_lorafa_20251201_161746/checkpoint-192/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb4e8900ca74d271df161df3e78c5e3163d3ca2c --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-192/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac63e93328a0491bc31c5b67747712626467b0c1fab68bd8f3a90d2ffc2d318 +size 1465 diff --git a/dapo_lorafa_20251201_161746/checkpoint-192/training_args.bin b/dapo_lorafa_20251201_161746/checkpoint-192/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..63c3421a8b566700bf579035beda17ca249df912 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-192/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd9fc68413aadb7b7d40e9384c483b1d5cb1998f40011e96c2faa43e1188d7d +size 8849 diff --git a/dapo_lorafa_20251201_161746/checkpoint-256/adapter_model.safetensors b/dapo_lorafa_20251201_161746/checkpoint-256/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8b40d80ce2e2487375efddeee5249110e2967ab0 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-256/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41906e01107a02c0b2b8687ca3b784170b88029755156748d2adffb4b16a6188 +size 73911504 diff --git a/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_0.pth b/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c2e532b750ba74231a957e8d704e2aa12bafa67c --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc9faa666c8e2527ea7bed23897b39d33080af7cccb4078e68ca0c896b5d8195 +size 15365 diff --git a/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_1.pth b/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c4106748d74bb32c527454e6748fe3da7ed37ed --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a16332f011af8c1b24f3f970160aa16d895f8d07206b52ed81aa3e6660e02b +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_2.pth b/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a6ff39559d7f346fd81a89130dec8b74f2c93f07 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e36acfb44e91aff8cbc0069f327291b85586996e8f2a2dd9582b7472a9cf221 +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_3.pth b/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..493dd1f1f6736f4c9aae79487e1adb395035c9b8 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-256/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6efc86b6ba7dbe7bca217f58ff5501185e82b30ad63c05d45b8af1a7e0286a +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-256/scheduler.pt b/dapo_lorafa_20251201_161746/checkpoint-256/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da175406e5951634027623c46687436be96a222 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-256/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8495f527d2ae384d255f961a1b604892e1f5459d17e99146a7b64167ecb9365 +size 1465 diff --git a/dapo_lorafa_20251201_161746/checkpoint-256/training_args.bin b/dapo_lorafa_20251201_161746/checkpoint-256/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..63c3421a8b566700bf579035beda17ca249df912 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-256/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd9fc68413aadb7b7d40e9384c483b1d5cb1998f40011e96c2faa43e1188d7d +size 8849 diff --git a/dapo_lorafa_20251201_161746/checkpoint-320/adapter_model.safetensors b/dapo_lorafa_20251201_161746/checkpoint-320/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e9ca0b8b1ad5f6b5d1e3707e0e9d98aeff2119b8 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-320/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b881d268d05cf8f00b00108670145daaeb98db5c002523a22cbbab5ae0787a49 +size 73911504 diff --git a/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_0.pth b/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6f57c7b82219239984e8d695eddb6fe9c86cea7 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:474379631942f97dcd10d88b87f826f0d91083dd19639e07c40ada064b252fa6 +size 15365 diff --git a/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_1.pth b/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..51a9682c44e844ee9cbfe10273916ede28ce68a6 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec4cb64222679a191edb4e2a0d732a7f3c6dff618aac4145aa5de5751c4e52d9 +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_2.pth b/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..e90ab0ad64ec7c6de0a70500f0d9c544b521a6ab --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a5dc7b6767259798144c909b3a686e83fd9cd7182fd586413549ae4fa25a91 +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_3.pth b/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..5a39e9e5367c82794456e721a8f670e74b2a0f14 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-320/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b3a6a8c5ec77d8147b0468cc9c99964921e53637e8998e06782c32eb89a1d35 +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-320/scheduler.pt b/dapo_lorafa_20251201_161746/checkpoint-320/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b635ce1666c50e816d388484f117d6c351b92d3 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-320/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da013ae0b2b98d7666c2dc2fe7c1c09f26c72a818d58bd9b5b49a1d1f432bd5a +size 1465 diff --git a/dapo_lorafa_20251201_161746/checkpoint-320/training_args.bin b/dapo_lorafa_20251201_161746/checkpoint-320/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..63c3421a8b566700bf579035beda17ca249df912 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-320/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd9fc68413aadb7b7d40e9384c483b1d5cb1998f40011e96c2faa43e1188d7d +size 8849 diff --git a/dapo_lorafa_20251201_161746/checkpoint-384/adapter_model.safetensors b/dapo_lorafa_20251201_161746/checkpoint-384/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a9fceacc27a75e18dda1939f0d0a76c38e1e6a7 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-384/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41dc8e9d0f7fdd58e14a843c38058acb9fac560a009ddd7e027bab3ced39fd51 +size 73911504 diff --git a/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_0.pth b/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..9beeb83767d77824f8e53df1c6b5ab65da6319e5 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42549f40898560280fe13a0e1ebae0e79fe7aa741e669df97c783436b01c67f7 +size 15365 diff --git a/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_1.pth b/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..936a02037094d5838a9b861a8304bd84902d6d8b --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d87c4e6cbdf18bd6014e757352bf82d3914cb91e503521fac74e2890ce4384 +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_2.pth b/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..be1e090c1a6c13004522825f8c68409805708cb2 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1ee8dd453eeb0012860333b3e3cdb72439e89beef7d52192520bccf0566e1ba +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_3.pth b/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..fef216671d7b2024cd6c4600c3f5ea312e8cbca0 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-384/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea94f512aaa0d2d85550541adcb83232f4eb2cd0725cc72148e509b2b65a609 +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-384/scheduler.pt b/dapo_lorafa_20251201_161746/checkpoint-384/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35447364346dd4e48ff2912c9630fa0d550dd81 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-384/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a73b3132edc693a316dd18b0560b36c0fb0501d1030453a31a1309122a6bf7c +size 1465 diff --git a/dapo_lorafa_20251201_161746/checkpoint-384/training_args.bin b/dapo_lorafa_20251201_161746/checkpoint-384/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..63c3421a8b566700bf579035beda17ca249df912 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-384/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd9fc68413aadb7b7d40e9384c483b1d5cb1998f40011e96c2faa43e1188d7d +size 8849 diff --git a/dapo_lorafa_20251201_161746/checkpoint-448/adapter_model.safetensors b/dapo_lorafa_20251201_161746/checkpoint-448/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d46a6b0cdc5ace2e1c92041388745856ecf2c184 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-448/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2864f248ac1a0e2b41a0e8c09dde419af85f1e36c7aff865d16f79e610f74937 +size 73911504 diff --git a/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_0.pth b/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..76ada4e530232beef6490051e63ad703a96045b8 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464f3e435a719ef25b0a0acf5fd89f24cd9032e1483578a815d6eaa85a6b4aeb +size 15365 diff --git a/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_1.pth b/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..82d71a7f119d97f05eaf57a9cd7088d01b1bf55c --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:950d831d58008d526753c0b15e6f2cc23be06c994ae140e2d759a6d9c3d9222f +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_2.pth b/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..cb2f1b7fa7252779afe5cb9d6fa041e2e14f45b4 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b999c479874fc4618d2b415742c29331bb5f3e8cea6095ae7568f79bf31267d4 +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_3.pth b/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa657e05dfb4403686648745832fa9e7ec046b34 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-448/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1e026c04a975ef010155ec5c74a4846524d6a169fcbae23ac2c17ff83704fa +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-448/scheduler.pt b/dapo_lorafa_20251201_161746/checkpoint-448/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a39d5aae7a5de28bbf7c8e26531da9f7f0cda3e --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-448/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d50e6c2130ded251cbd3fb239e3a2e1e0564766292c69bfb4aa6ba0d973844 +size 1465 diff --git a/dapo_lorafa_20251201_161746/checkpoint-448/training_args.bin b/dapo_lorafa_20251201_161746/checkpoint-448/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..63c3421a8b566700bf579035beda17ca249df912 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-448/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd9fc68413aadb7b7d40e9384c483b1d5cb1998f40011e96c2faa43e1188d7d +size 8849 diff --git a/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c670972297c209254080ad49781dc57f5069816c --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1324198f9e2a83f5d6b0289fa567d667ef43e0ab6f789764ef6d7a7470a62c09 +size 61940613 diff --git a/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c12f8923cfb1f56a2cc24f8e6ccd379e9bd81617 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a785d16b712baeae3cec50b3c776682d277ea9034a6033d7315056e2aacd5a24 +size 61940677 diff --git a/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de617e5c859fe509bb6ff59fa199a38e6c7c0d5f --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2926d221c12822c4647f38936e065fcde93e10e5c4bbbe9e4b38771192db673b +size 61940677 diff --git a/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a133f2705d9f9d2e6fdbe7b11234675693bb1af --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:161f1ddb765796581d03ea6fe8f3733aaf3c0d50d3cc1c001b055b742a133c7f +size 61940677 diff --git a/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/mp_rank_00_model_states.pt b/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aad195e01e72aa410798eb93a831dffb7a84df03 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-512/global_step512/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6d8e203679d7f3f4c251282b829d3fbdbe41f1abfee0d0d4a5bde298310a7f9 +size 41536409 diff --git a/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_0.pth b/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..931f223924fd9241ace77eae277c0b28490ed0cc --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16a1ee699fc26c915ca96e8548f6f3c81ed445b02961bbc0a07b374a835a57a0 +size 15365 diff --git a/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_1.pth b/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef164c39bc7a8a95ca9cbacb10380f7a559788d9 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa8682b5053bcd2602bf90520e3d0ba99e95e9e06560548fc593be433b7dab6f +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_2.pth b/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..6ba07d09d944fe026d96b91c1e045c9c66c3377a --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6081adf9c570536f946f75c6cbc3344cf207e9da0d995a9b8f6bd2c3b3a5288 +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_3.pth b/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..406b0e4bdb3e8917ee9a2abb5d6363a958935913 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-512/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc4ffda786efeaeb17c67ef7db631f3842ea8a5e1d78a04a9d99c9fe8d1fc97a +size 15429 diff --git a/dapo_lorafa_20251201_161746/checkpoint-512/scheduler.pt b/dapo_lorafa_20251201_161746/checkpoint-512/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..4800a9e5803399b265ffcab0af9c3fe980dbd948 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-512/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0e61c4f166edd4bd232bd6fbefe6d67a5b7e00cb803d1741eac9a6d2b7b6ee +size 1465 diff --git a/dapo_lorafa_20251201_161746/checkpoint-64/adapter_model.safetensors b/dapo_lorafa_20251201_161746/checkpoint-64/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52454e0a151a57bee08973a7062cd144fa1b4717 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-64/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:688a28015553090c333efd41b55763bfa3993913ab4892d20ee007b428e5346f +size 73911504 diff --git a/dapo_lorafa_20251201_161746/checkpoint-64/rng_state_3.pth b/dapo_lorafa_20251201_161746/checkpoint-64/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..9a1f16d4eecda8348573567e7ab39cb80e10d515 --- /dev/null +++ b/dapo_lorafa_20251201_161746/checkpoint-64/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:162d6ac3a8627082c298eb943a9ef9fe6186c2502018c1ff3c02004c6711f535 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-256/rng_state_0.pth b/dr_grpo_lora_20251130_192918/checkpoint-256/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c37f65416ef131f7639dd4e113ac6211856e41bd --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-256/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe2e5ae8b3c55da3806cd635dafd2bd67ff200151d461efc2c6bd5c375f0a98 +size 15365 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-320/training_args.bin b/dr_grpo_lora_20251130_192918/checkpoint-320/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ec0bcd20c557848df5808d72f346bb69c0a3c51 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-320/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83cd5486d5180d58247f637807acbe17122c3efc1e32ddc464dc2fac8f414516 +size 8849 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-384/rng_state_1.pth b/dr_grpo_lora_20251130_192918/checkpoint-384/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..14151094bf0bafe40d3faad4c12212cc9c4bf3e4 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-384/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1544ed6013fbf8804d76cbe0dacdf361af3b424d541bce2179a76955f69d1525 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-448/training_args.bin b/dr_grpo_lora_20251130_192918/checkpoint-448/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ec0bcd20c557848df5808d72f346bb69c0a3c51 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-448/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83cd5486d5180d58247f637807acbe17122c3efc1e32ddc464dc2fac8f414516 +size 8849 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_0.pth b/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..7296ca135d33aa3728a740d983084a551d952773 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f637ee6504027d1b6e4274d84848d8221a5ff687c00e3f7a6a0351e5c212517e +size 15365 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_1.pth b/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..2e0166fe1a1b079e30717482290b2276351b2957 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ec5ceed77e858bea2810992f0b9234597f6b358a6af2cbc742ff0a0e454d7a7 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_2.pth b/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..d066065fc598e6016d2f6371a837859ac2a66f7b --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6028549d0547b58f0affaab7284a747ece762a11c5464612410be950ab0da9c7 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_3.pth b/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa055e24028151c29d0adf3184f2f707cbca00c7 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-512/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910c6a511c42312c4fed7f00941c2901d34c51f864a054a0e4768bc81a3b5eaa +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-512/scheduler.pt b/dr_grpo_lora_20251130_192918/checkpoint-512/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..4800a9e5803399b265ffcab0af9c3fe980dbd948 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-512/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0e61c4f166edd4bd232bd6fbefe6d67a5b7e00cb803d1741eac9a6d2b7b6ee +size 1465 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-576/rng_state_1.pth b/dr_grpo_lora_20251130_192918/checkpoint-576/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..3cd25c4c833bb21fe5e7b182231ec7f5e48f5072 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-576/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ec4083e1635a72dab9251269fcf7ef5eafb509acc0684df360e1b0c7fbd3ec5 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-576/rng_state_2.pth b/dr_grpo_lora_20251130_192918/checkpoint-576/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..e7d68df2c5cef321f995233c1b8a2d918358ca3f --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-576/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51fc9c991a7e7d4907ffc8ebc1e927ea54dfddd627244fbaeccbc0279d9f8aab +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-576/rng_state_3.pth b/dr_grpo_lora_20251130_192918/checkpoint-576/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..4577c3da178b4e7d0b96748f7798dd044bfbf389 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-576/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd6def0b1d0c93b6a4d9b20c08d5f50ac256f7dac52601d93a9c20762640fe4 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-576/scheduler.pt b/dr_grpo_lora_20251130_192918/checkpoint-576/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..454813a4990df191f6951cdef743cc653ff31f83 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-576/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105f4404298e62d6811a76a80078eaf19c435d835ba8926a324f78dfdc9fb5f1 +size 1465 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-576/training_args.bin b/dr_grpo_lora_20251130_192918/checkpoint-576/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ec0bcd20c557848df5808d72f346bb69c0a3c51 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-576/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83cd5486d5180d58247f637807acbe17122c3efc1e32ddc464dc2fac8f414516 +size 8849 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_0.pth b/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..04a1af57d0b9f923923c9203b6b2787d73895808 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f17fe94476c27fddc13aeae00339fb5155e671611d5e18a7f50dcdf490aa9c67 +size 15365 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_1.pth b/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..c9cf94143509d5ff3b3fd72604139afde22422cf --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73194c8a560f2ee0700ccfe61a7f94f76c25b882684e6a681353e1b9cc43b4b7 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_2.pth b/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..14e187451273740eaa863f07558ed99465a58835 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86e4bdbcafd63d84165652521b357239487038a3481da009ff86f8382b82bb31 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_3.pth b/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..1388e573caf1782c87eb573a3c397ba2d2a81a8c --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-64/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:092398bc98e3947cbdf172f34c94ab83683bf39eba6e89984f4346fa7f6c75ba +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-64/scheduler.pt b/dr_grpo_lora_20251130_192918/checkpoint-64/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f18e6fbca95d9546e2f67129f5c8f7ba7da9e16 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-64/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93cefd10607223128e502b13dda034a13939769cee1c2b5c47751dc1ef0425c6 +size 1465 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-64/training_args.bin b/dr_grpo_lora_20251130_192918/checkpoint-64/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ec0bcd20c557848df5808d72f346bb69c0a3c51 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-64/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83cd5486d5180d58247f637807acbe17122c3efc1e32ddc464dc2fac8f414516 +size 8849 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_0.pth b/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..4c5df3b18e487c6cf837ea504c7342d7c308bdb9 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fc1b92a0eee3555f123ef2e489901ad7e3e037d265d5a8933e684fff5011c88 +size 15365 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_1.pth b/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..7d7d0253f39784bdc652dcb2326136350b849ac0 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84226b783f051f9e05009b3698b4a78b2594b82074ce0dbc882bdb6464fa2706 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_2.pth b/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..761dbb6d52a2da2c5b5bce1fb9922cdf70ca7d5b --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f18616a7f9b3be53a7c91467191be90862f1e73abf0224c8396df20b02285eca +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_3.pth b/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..9573921411621c1e687b5f240d68ede770e69d06 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-640/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5deb6c0893e9218d06b524d8d881210ce3a80698b8dd48dcf7b014d528dc9ff4 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-640/scheduler.pt b/dr_grpo_lora_20251130_192918/checkpoint-640/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce72654f572f2506f27160b816a295cb0b390c16 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-640/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a218931437f4ccf43b090350bb40ee3df136a61635dc16c5ca38673a829c2bdb +size 1465 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-640/training_args.bin b/dr_grpo_lora_20251130_192918/checkpoint-640/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ec0bcd20c557848df5808d72f346bb69c0a3c51 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-640/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83cd5486d5180d58247f637807acbe17122c3efc1e32ddc464dc2fac8f414516 +size 8849 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_0.pth b/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..a0de00aa5e0665dd6799ce37584dce8d9cc47e91 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:730ce8214a75fe862694e3fbd13ef9dcce149ac6046a6916c1b51ffa4a832041 +size 15365 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_1.pth b/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f8a2ca19870e6a43c3692668b870f3ad0009e6a --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899b58c04339213949d5ab04e0c3942a4f72fd6eda516f7ca8fdb83b0ad2d00a +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_2.pth b/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee1ff8c1f368b03c7d23a489226dccc33106b9d6 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5874452ae57121b6784d269da40fbcf6c2dbbc4779490f2a84e7433116e4eb6 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_3.pth b/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..c0242c39d21e8b8648e1457dd4695a1e6769fa36 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-704/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27073815110cf1150e0600a915c88fee6b22580a61420084a9ff4d5cfe4af4fe +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-704/scheduler.pt b/dr_grpo_lora_20251130_192918/checkpoint-704/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fed940bed83776fee227b5936c168e6282b54594 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-704/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11998cc5f35748b7722fb0b2c7a077a4a3e3b00ac72b4ef20efa3259e7892c63 +size 1465 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-704/training_args.bin b/dr_grpo_lora_20251130_192918/checkpoint-704/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ec0bcd20c557848df5808d72f346bb69c0a3c51 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-704/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83cd5486d5180d58247f637807acbe17122c3efc1e32ddc464dc2fac8f414516 +size 8849 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_0.pth b/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6695b986d9f4244f6c78352f1d642fc2d79a81d --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14608224dbc6bf41dd773e2c53baa31fae57786ce90b7d12c193026a19636514 +size 15365 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_1.pth b/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..62470800db6d9bf58f65b9619706e064976e8af4 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8293aa6aa24cba78e31499863f833d4c811d6958fddb974717a82fc4f842aa3b +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_2.pth b/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f69281a818fbb84f3ed09324acf258c167bd58d5 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4651a4bc96587ccb1987eae889e66ee471824c7e69ed70fceece3b04fffc5a86 +size 15429 diff --git a/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_3.pth b/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..77ba314c40c80988e65645d049329407189da888 --- /dev/null +++ b/dr_grpo_lora_20251130_192918/checkpoint-768/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07fba42cf13c971eb573cd20d7077027bc8e4b530f62d9e39035a9069dc70030 +size 15429