diff --git a/.gitattributes b/.gitattributes index 8c88070d66a30ef5071f8725ea7af848a3df2395..628b290ec6a698bda0c22e5ed48f20b0ddc0e268 100644 --- a/.gitattributes +++ b/.gitattributes @@ -144,3 +144,45 @@ dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/tokenizer.json filter=lf dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text dapo_miss_openmath_20251129_124147/tokenizer.json filter=lfs diff=lfs merge=lfs -text grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r8_20251129_135342/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_miss_openmath_20251129_124147/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_miss_openmath_20251129_124147/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_miss_openmath_20251129_124147/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_miss_openmath_20251129_124147/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo_full_qwen2_5_3b_20251121_111716/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo_full_qwen2_5_3b_20251121_111716/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo_full_qwen2_5_3b_20251121_111716/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo_full_qwen2_5_3b_20251121_111716/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo_full_qwen2_5_3b_20251121_111716/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..159465d44980f43b9809653d96e4cd7fea94bdda --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0af91fa94c1610d26324df519780960ada6a1f27e6c74457200f6f046518b7e +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a7abbd61f63d17cfc18b60f946a4b16de4b2227 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e61d560af8f44e44ea55c365f6bda9b655b62fd537dbb8589e58c8acfdd6e2d +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ef7deea0c422a6cb3468d59335ffa72df84115d --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43782022f1851c42edab18d1c5f754ce3318a94c6cfd07c10589121054d43acb +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9dd67b9f10d7d48f286246e9528d0f72b286ccd --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f63a4cf9a2c4463735a8001cb5dbf663a82c5b8dde35de52e313a5098e3d25b +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f5cf1c5a02200af5c574186d77d01eff439c7cf --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9858506d5dc9b37ac0934b2c44e6478e6c90de6289e4eab46bfd23dca29e4d70 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43c8969b4e580c5d33d6feb01d14d2ef05054054 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d62d43f0589d5a774cc4ba084fae39730c03afd1f6529d10822901c526a1a42 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e1fb20f6714bf43d9b0ea9e918a8e5eedd712e4 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ed58d17dd28520ff467ff12f58d2d6ffc34d7f0447ca1a77dabf050c32daef +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3dc2e38ad2f21cbb50e9d2d4254be006ac4bc94 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b91cfcffe025fa39bd52df7ae8603e7ecad8c3cf1f02b22594f9a3cc82bdb10 +size 110803141 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..836de861f23b9bc11c2aa8fdb2ef09af3c6bd002 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae04a994c37693b00f7f962f1f211233e1d17bc520278b5f7a4958b7f6b21ab4 +size 503979621 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3d646291acd10030c007a270a64a481faef8c27 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c173f80e553c6402b63194adfa25d1ac0bd85953f8851eacf4b695efabb70c25 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6641a53d45a3bffdfb4c6c13fd6cfa454740720 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:891309f12d74e579d4b2a160b4bcf4d5eb1b9e3c2eb051bce449babdd7f282e3 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..158dbff2de6ce2ebcb491488893c1b7bbc6ae464 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35b4acc54f285d39837fb8f3cb7babe474b62f8d0fb7ba77f2e85f6ab7559058 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d179694fc602f84765d41897921b8e1b1028616 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73ab8a32b47361d5715d893043ccb60c9cdce6eb03e27dc46e57df0a14eee7ae +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ca3c8b1fa5be7743993ba612548380ef2f17e65 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e1dcaf732a948cf7a50f302152165b5104eedfb18a70442b8a65a2166542480 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6531912082086ef269c69f8b14065f22c67cd9dc --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5226b106ef4399b09158f8718db0429575809b2771b751be8d1420301d4faa1c +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08eee1cfd08d722f9f71817da07c20ece68ea469 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f422db28bd7cbbf94455b7c5938c08e9dce26082688ca6f8809dde5cf96a82 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd01ba36ad17a8d859b67694cad10af830308bcd --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c708ac2a56999d8f95eec4c5b2d5d33ce7d73acc7286f7030deb351ebde2ad31 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..544b4a91d28c83df3bafebbe27359c84497fb6c0 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcdda7b81653c64a3b84a47fbbab27e73126c01d4fed3f71f39fc1c70e04e409 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..904cf61208b4ef24ec814e212b9922b519994136 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f1c2ee723f342ea0e40518d97402dbb7cfdf3f7ccc7bfd569d7a05c8e52c531 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dcef030fe78db36064e944ac6085844e96a1bea --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59195cba6a18b9f10b45eb779dbe7bdb9165776bd5f070345a7a0a43ad769384 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5c63df38c965fd1919bf3bd4918b2ddc721c29c --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab7b90ad83442282f9e32c7ebe09e8a928bb21d66d37e7395c570ad7a05336f6 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcacb3818b6f970c4a35f00d2ee4343184d83aa5 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23bdd2fc827e4743510e0a9069ea2ba2cef1f53b7aeb7c55ce1e188f471373e3 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d26ceca191a606d7f89c263e6628d95ab046488f --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6302e73dc96b08ce363eba908f3a38c4b12517c8e28bf6528ca133fbe579619e +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a6117362d7eef669447159e56ab5aafb32c52c6 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d7d899edea76ec13fad77022e08b7dc02cfb5d307607eb38cb47d38a3ece5c6 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42e10ac1c63bcfb780778fafcac21c9ab12ee3d4 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d3a85565f7e407cf1e18e6c58f84583443d68f16ae89b64065eb9c96d9027af +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad075815df4d84eb0a5b4582b2581121b84b8192 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077819e24822d61a5ffc0643f6edfa4acee55ae1e413ce52e6e70efdb3223c92 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17390fdbba4eaaade6bb678d9a6b01a7e5376590 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb9777c0e29a8b4c103c903cefe4f99dcd4494f72ebd61c5ef92cb3a0d2ec92d +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c47f0f6648c91076e879c641aa495dbd251fe3f --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc27fe7078af666ff592665254037ef893dfa00270077c5420e8c525c79ea515 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d4bfdfd761cb3bc1bfa82c64f04fc50e388ea61 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ea48117ae31f72542f7e44155ace0461b0a39dc2491b588da754676aab246e +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c623af1bb11b0eeabbaa8b9f6f42a1feb5f7dccc --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a4b54b071716e3dff2404aab252f8cfa81dbea9bcc94a255d04ad66e82ccb3 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1513b3f5cca79b5a44fdd79b0e0eb8450f1915e1 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f55753d8feebdac46671689cb05e1d8e48d31bde939d461ac8c70529f627023 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d503f436418f8de98ed8bdf71ae96c7ce46d75c9 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23aee3396d9e328d7bf9fedf9567091db8f907f6972d3300008136bf0e26d6e1 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cc1cff6e1f377d1e6d517ee9bf576567a37bac2 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:716d04c8400d2b013030e40f981724b86a2425b7fa36369b7cb081f191300b87 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df22e1a38bddd8296c92fe75521fad8a2bb0ea53 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7f4f5e79e23c9bf656d32fadac7a179aecbf170a85f2a284f05269f2785daa8 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c9effaa4846f23ccf51cac78196316ec65e6897 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27f2358fc29df07c12d7e90ad7c60b137f4fe0c980c73cac87798c81766d40d0 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7a0846537b89b3a52232b36774af99d25852e64 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:096271c9237df42169929a141b5833bdaef66cde2e12e05a9ab44dc5c0f51cdf +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..753c1cc199ef295450742a5e2e070c854d704aa2 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2de8b7503c6a435e15ab55b5b622c934c4a965859b99bc981efbc7048fcf62b +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..55494bf38d1bccfbb7b741edbf0489930ab098aa --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eefb59c1f5dc727ebfeb008094fdc6f7f030a7acdfbe40743ed0fd322e53e2f4 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..422f9879de46846bf6605ab814642418fe5f57f7 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78dfe1964501784207ee53c77ba9d42420c1754407a05f140ede870bc0d561c6 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f97d2d0640a11d4c6011cdbb816a42afda338fa --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc2bf523806805907cc8f8dd2d48095cd4e31978d5884efc96128cf22d76357 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3862d4ef87347a2d977ec9ba19d07e13459c6cb7 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e83e929b8f8bd2fc20274deff9ae942bd75ecd7155e3d439917128731db6e4 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..954bcc0f5ea2c44f9950d2a4f7ac5b4cdd29247e --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:945b0b1cb28d1ff18336559320315ab43643ae7b2bcac986d772b63e24323d63 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc2122e5b1f50a6d966a7662a032a2cb2285f10d --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a969dd0c97ca0262352193dd09fdd82dbc13e0692879320913fcb45ceee7f6 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d3b98d742ea1c940bbb881785964b0f1bd8b346 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c13ea7f654aaea2a7400b6b97b67af7422538cd27a74da3b0a9a9572f2f1fcb4 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11f2a23bad8dca2eedff31dc7e490401f2b2e9be --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c7d40c938363993b77c30a7f5e374b1f027c14b04f2842c8e72de4eaad6e541 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06efaf6eeedf8ea07d442c1f4948873788255fc7 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:132b6fde99a306af9f933041db48f877de556219975ebeb800030db53647aa33 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20d3fadb97696e0bf6c9ca641c39f690fe3e2ada --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcbc8dedd1a9a23883f111254f5cfefed63c3e2e6aec0233c46317bd32aac6f3 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffee593b8c4a00074eabf9382ffd340be99bed6a --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91fb7ac83b6decc36e431ab48ffdd6a577fc03072ebea1aa0198df2b631b9365 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e07fd0a8373aa33e7e6578cf7757e413b6b5ee2c --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5926ac5870d3bdaa700fb2db69b0cdc6f662af534dafe10d46c357408d5faf32 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67f8468d1311464672e4ab69548adfb8e139bddd --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd9bb93a5b1d08c491445935d0a2888f49ff71a4d30c636bc68a422a72a628a3 +size 55408837 diff --git a/dapo_lora_qwen_1_5b/checkpoint-1024/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-1024/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..24d5ebd0d0b7b18f3347cd21d7e66e3b540c5e5e --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-1024/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f165d3cfa7f10835c227107d9213783315a50a85366063fafbb8ee29f7201c5 +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-128/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-128/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7462b9b65f45e81aef1b90b391ad8cb3bb6f86cd --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-128/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584dfb41b5ef5705cac93b775ba0a0d02aeb40badf5e167632037f9496524231 +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-192/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-192/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..49d9c2c445e845f55ca8e19d6b6e26b857a1605c --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-192/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ac650572647372089089e4ff64d88e428421bd36862ebcb37b515f2d5040dd5 +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-256/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-256/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a35aceaf779fbceb35fc96062db6ef324f3c5442 --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-256/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:757151996c74322c9c182ce2c761f5f0876b0f84fac6100c55f0147979bc4be3 +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-320/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-320/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7f14f7a7fb35d164837f239abfbba3400ce0a94d --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-320/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c060e2710423ab812d78ff6b01e2a983997a209a41ec1fb51df846e2fa79226 +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-384/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-384/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..17337ae94fd8189aac7eddbaae2108dc5cfe4e2f --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-384/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:454e4c93185d14dd6373961a0eebf020cd8d49044c117e19cd6a39f08cbc690b +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-448/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-448/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3aea4d34afc9694bb941913db421ff12bcc56d92 --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-448/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c07ecd999d06005b9027ca77abcd7746e741023a219e1ea730225df628355b6 +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-512/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-512/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..23d556d22a5f5e7bd087e0d8c66dd04ce30f9670 --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-512/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf2af41aea7d8dc21adaf59bb85ad32a334cb5132830e23d79e7d4fcca59bf6c +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-576/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-576/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ce85768772980dfdd26daa88953de748fc389f02 --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-576/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e740cd8b795487d08f5385c15b829d31a6ad5a19aa399ccc6c213e08cdf7444 +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-64/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-64/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1e0d280c8cf675408380e3027cf732d73f676bf3 --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-64/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea438f7d6f69cdbf231fd76c8a12ceab53c30e37e1f9663acebf8c419a48b23e +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-640/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-640/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..60375cfbd376b0431001ffe5c84bd4d584101cf3 --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-640/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a01726d2f367e26dd0fc496fb96826a6e6e104457c056f87cc55dec29a226e8a +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-704/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-704/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53a1d60b3bbf97ebf77d8a87b5361858bc309f3f --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-704/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa8cf44842c1141e6bab9baa0de5394f0ac90c9a713c49018c0150d15e1774fa +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-768/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-768/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9d6a47432e1d286ed786e51f5fb2ccf4c34a1aaa --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-768/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e31d14b45279e04aa4f38284e0a05ab01a90eaad0de33cd1cf2634f7418b9f +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-832/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-832/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d143d8042cb5df5225773f0fa14872306c2753b2 --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-832/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb04f44650f7e9913e61599336a4cc4815ca528ed67cc278014b4a72e38c8693 +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-896/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-896/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0dea0fd01a9c90c65be373b8252913bd88554674 --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-896/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e2fa2b5d460f4aeb41d913783a0cb6667cfba750799e391897738c62429ce3b +size 36981856 diff --git a/dapo_lora_qwen_1_5b/checkpoint-960/adapter_model.safetensors b/dapo_lora_qwen_1_5b/checkpoint-960/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..58c52b06db935e0ed11b603fee383ceebdb11c22 --- /dev/null +++ b/dapo_lora_qwen_1_5b/checkpoint-960/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb403abbb622ab1f58e14aa7730003833674d4a741a7f302e1bb8fc0a517690 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..24d5ebd0d0b7b18f3347cd21d7e66e3b540c5e5e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f165d3cfa7f10835c227107d9213783315a50a85366063fafbb8ee29f7201c5 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..24d5ebd0d0b7b18f3347cd21d7e66e3b540c5e5e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f165d3cfa7f10835c227107d9213783315a50a85366063fafbb8ee29f7201c5 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..772ab51d8c348d8f804aab6fccb863a6a9b53ff4 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:585ce2e4eb2b7466028975caf2f42eb7a482e06fa3ac7493e0acb64096b49156 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6dfbac3dce1037fd7ef242cbb717b0a4e83b370 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4cad3ed680d4887848bcbd632f7f8dcc1d5eac6da4c2f0aa8a07add02ce00e0 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0097e8f8c987b80428362268bc72a50ee5d54a7 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0a45fb5ba6508fef1994873c1d175f9dcfcde74fe6405c17b4b65e04ed34a87 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3268ff487ae7d1b6dbcef1f90f4d439ba2fcfd99 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fc512d961262cf29777727a27ff4ac64d0b187388c2cb3a4aa516d29475257e +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eb8e19a69d93d22ebf45c70d3b37b42543cde2a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a3afb86ce95b5d1dcb4456cd2de82b80a02935c4db41aa2e9b2d5343fb17f4 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7462b9b65f45e81aef1b90b391ad8cb3bb6f86cd --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584dfb41b5ef5705cac93b775ba0a0d02aeb40badf5e167632037f9496524231 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d4beb0d1807249cdd99fbf891fffbcd8b2f6078 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d418bf7ad993cf6c071366012c35ab5dc69052fd15313de6937d8e6987574223 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7937e6f2c27121695a7cba28e3900b48ae2fe68b --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:598e6c05e7d97d25a5f00e3c14990cf882ec5c006dc2b1156ba4e46179e9fcf9 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7272d3851134f7e981d0f4ed86827ade12cccf2 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef74fb6b2ccf7b56ab3fae101feab1ee3fdd3fe9060e8dd1149b434e2e81b5f8 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfddfd1c39d0a05842137ae515116e1fdd2fc55e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:856625e2fdebad3ac41a120005f2b4c8d94e5af9bbebda7c322f4b48158960ef +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61968fced2f1f2b60b640748f50a358c68660192 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/global_step128/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4caa27ade9ffd994ebd8c4d867956a9c9b777bc5c49d14512e9680d2eac5520e +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..49d9c2c445e845f55ca8e19d6b6e26b857a1605c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ac650572647372089089e4ff64d88e428421bd36862ebcb37b515f2d5040dd5 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be1422ade5c36dabdb8418ed3e6d029073dbef06 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab6bfd4338ac865bc1f3b31c9312f4c0f2d84ef1428a77c6b9864513cb6a3b13 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19b1d8982d09b0adbf587fd8932be2a429691f6f --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:945e13a8645f397c01d09ff536672a722addd6a832450e505b9fa094fe4a531c +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e25285ca8ee3980c6919bd80b2d1dc4806b0fd --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed2027744e3522c3bd35147201b0586c641d9b3491458008fb695a96b5a767ed +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b457dfee2215c7de60c97517d99078db7424aa5 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ec34749753014c56e7ade38a95f5b0e4cb073a2111f117b673614315c54420 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..905c4213a69f1de38033807be3a920f92cc93f40 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/global_step192/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd60f1f2e164c158895d36dc9a0d3c133fd3e5c24dee60ebd9020b4ba648f28 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a35aceaf779fbceb35fc96062db6ef324f3c5442 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:757151996c74322c9c182ce2c761f5f0876b0f84fac6100c55f0147979bc4be3 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bac99b7e560fa88f858402da79247d32ea96434a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31dbbdc711d869ef2f093f04bc2eb3c7a5b027800673fbbb8d8fcd25c6ed27d9 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be23fe154f376ef337aaf3c7b450ddc281da575b --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14e8e2123323bd122175f20ca6690507a19a9f7b95d8d864fff281a0013e05e7 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7f14f7a7fb35d164837f239abfbba3400ce0a94d --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c060e2710423ab812d78ff6b01e2a983997a209a41ec1fb51df846e2fa79226 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93559b3dd34b0739303b4674661de1c67d02b148 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0233cd2efc487907c49e3adb9d87a265eb6381d1c258e1448f5c2c08535c7b17 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ce9d78c8dc87a2e36e2900ab1dfcd91f90344a0 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c211e80d8db3b5fac2ad7baf0dd4d5788710205fe61a834a2f16ce4957339132 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a28d3cd086377a9e51d33964f4efa9a6f13c548 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b939a8e745a040f4d63e4540d1fcc1bcb0935d339d3a7a9dc9f4bff3bf077a7 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3221cfe7c89e91b56f8977f841a624eb6fd52688 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31d129f2b3f9fdd32af4e21fec9478c88f2a145826c8c0acaa723a4bcf47fb55 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..17337ae94fd8189aac7eddbaae2108dc5cfe4e2f --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:454e4c93185d14dd6373961a0eebf020cd8d49044c117e19cd6a39f08cbc690b +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f4567d355ed410b40388eb28ce1fe3b1f0eaf13 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dcddc7cd750f2f6c80c540d3b65a8cc37e1b685150191a7244a80924588400b +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0942a84648652b9df8796ad568507d1aa365b380 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea3377b03f11b6cd1bf2c5215b2d6be0b5a63d6307cba37cda72a738a8ce14f7 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fa88fa14c04fdd58ec742e4159883fcfa676d1f --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b211cb4e540eceda2f6e64fbba936653ed292c63dbc61fbf724cc103e4f7b657 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..2a548cd34674bdfdd4a306af0c882d3b021bcd81 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045ee30efb3989babdc3f0e74bf7daa60a6708f1fbb35ccbebb48db9eaf90d7e +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b8375a19b3ac03b6097e5e00fbc3e9f0a0b6c569 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f9611ad75f003f58b2d88b032d89d95273ec8a87de1380811b110ed81f708c +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35447364346dd4e48ff2912c9630fa0d550dd81 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a73b3132edc693a316dd18b0560b36c0fb0501d1030453a31a1309122a6bf7c +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3aea4d34afc9694bb941913db421ff12bcc56d92 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c07ecd999d06005b9027ca77abcd7746e741023a219e1ea730225df628355b6 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab5816155f34b54ef3696d7564078c57781734f0 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6626be104b574f0fdc414a3446b1586a7a463d95f03aab12cb5258113fa10451 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f03476899b37ecf218012f9d6ef3809fe6de653d --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c181715206688a576eb376ee807c511a2e6b2a2316d5388ffd5ef78f8deb239 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..230dd5297802a8a9afa75a84c6459c3fec5e4493 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:773fd8757a257479c0c10e5c1bcd5011fb4294941f1557fd861f203fc54c5556 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e761e5b2c14cf63ecaca7f084f005eae192e2efb --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c5f2f9a417c333096134ba70c759cb0e56c26c8c0cc5275548d587ba111549 +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..c8eac1a2219024db1fd61dfa68857a99bc731bd7 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:396587da7f0884630c2e7d0db56488d33218b3d31d533572cdc0fe5124169624 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..d26a88f9adc8cade3b472ed5a4822f68b6938d2f --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aacfe84db7de450c69922dee352a27efafbf3deeeb378c4c84e820760bbc6779 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..2653289d6a64edd03bdb1055c09216b0d9e5a41a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46533456048004d3705d1a4dc9356930e3ecb30f9fcbb20eb628619943743e67 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a39d5aae7a5de28bbf7c8e26531da9f7f0cda3e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d50e6c2130ded251cbd3fb239e3a2e1e0564766292c69bfb4aa6ba0d973844 +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..23d556d22a5f5e7bd087e0d8c66dd04ce30f9670 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf2af41aea7d8dc21adaf59bb85ad32a334cb5132830e23d79e7d4fcca59bf6c +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bef9c403efae33631167eecb72c86face4e0318d --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc651f82d88fbb1cb7e82eb8a09cc0fee0245a293ec83d5f75b160851831405 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5054cac96c7ca9d5312ba8f971c375213e3548bb --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d83fa881e0db4f1ef02a4204a2a8bd109d3525f0ae38d66e4f3f001153b7653a +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36c56b4d54f7890fc1c63efcb82583d790d7866d --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e106187026c40b6b0cc23eb7ae1b9d5691e1dd678cdeeb7bbb7826a47fdfd7 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ec43fc4978f1bc822b67a70e00d97192bc7650c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0981e26d00345d4439d20e70c400305902c42b4af10a0b72d177139cfc67acda +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..f8945a38432f36fe039afef9c75669a32260b9ab --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8990cba736594bdfd464fa36bdafad2f0f32fb1b2597ad12449273a4d5f02b85 +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..7205f6ccf45cc411589df0fb15421de6eeddd109 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0806ddaf6c443fd7c7dff172b5ecca0577e847bbebada0cdf4c5edfa159a3aaa +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..90ebd789fd9b96737df992eca7b9c26da3022821 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f2cf9d7623d57213896c4c6942f7590b2cec7b5dbd0f7fa4169f0ecbfc05497 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf83c4e5066bada10ccd0027dc43398efd94e96a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6720c03f759c8d68132f22dce2bbda4b9ca519abb3c03bd000cf13ca63792a +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..4800a9e5803399b265ffcab0af9c3fe980dbd948 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0e61c4f166edd4bd232bd6fbefe6d67a5b7e00cb803d1741eac9a6d2b7b6ee +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ce85768772980dfdd26daa88953de748fc389f02 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e740cd8b795487d08f5385c15b829d31a6ad5a19aa399ccc6c213e08cdf7444 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d40c4b3ff6a5224a0c390d0d78e0b4d86b6a24ad --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b2919b32cd6c33ee7df40d7587b37c8e18ebddd654bb1521d69a6c4e016cd3 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29ba33d9a993107e1f3283df41a1a76e857db702 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71088e25cad99374821e35b0427a91f035627f7b287778af4f03231078d36804 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d132d4a9de8c104d8eae52ca84305359d53b84e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39ab7c73474c9090c957638f003e81b0cd336443649f5f1903e29a44db36212 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c8e5095ebddd318fe6e59da45066c566abdb2d0 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9869863b6055f183c4035e375179772a4a2795e2901c6acee594666a8fdd815b +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..0d91c9c3e0da3c13905603c5f2ae76558ad39bcd --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc85d41d7b96c21cd206e0928236338add8570f11c4205e257da173a358f5b2b +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..94f3aa8120e7fde8c71ef3bc4b938ca26e672f6c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:380357016cf9a81b0a9c75b07bcc7951be40b13b2cc49a3410b31d67d284eff2 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..ebd627e10f9d1d47555ffdd849c8bbaa4b50fb0b --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5b92574bb6f883c66da3c447012c2c939869c2c2cfb2e91d118821012d3490d +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..454813a4990df191f6951cdef743cc653ff31f83 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105f4404298e62d6811a76a80078eaf19c435d835ba8926a324f78dfdc9fb5f1 +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1e0d280c8cf675408380e3027cf732d73f676bf3 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea438f7d6f69cdbf231fd76c8a12ceab53c30e37e1f9663acebf8c419a48b23e +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e281c5aa7d3e152c009f3c06f22118a2334a8b35 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64705dd746312538dec8a7c36b0c6ff49ac87bafe15bacf76c8ed77c6ce8a8b8 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18847e1a08c2232c24fbe23c4a234f613ad41581 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a3d45a86cf101b82e19bdd5dd11ebdd9c27bd3c03cb473dd620d512b80e960 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57b2ebb58c72e2e19c158f1c42ff84bb9043e0ec --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9155dcacad7245d2d4ef096a98d6eb30adecbceaf024b17710c3870010b60db9 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..058ee881c80af69a431d2c20b41e598fbd724503 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d59688a9f69c31779fcecabeef0a6660672e8dfd9c8059c399186379d6221a8f +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05d9401bc746a792b12f51d6a2da7ddf485e553f --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/global_step64/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:014f6f74b8bba716df678b7c240bd95c32ec42038fb1e0965ddf49548d093d10 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..68db7bc2f8d0eb93a363079e3287390cf628019a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e426f1aa56a6164c9ea142be8d4c214774f60f67ab7bc6483d63b211ec06d38 +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f18e6fbca95d9546e2f67129f5c8f7ba7da9e16 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93cefd10607223128e502b13dda034a13939769cee1c2b5c47751dc1ef0425c6 +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..340fa386e2ecb7a912855c77e6b0cd090d42a7e6 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e452476424faf0ed523039c8e7b5be44d9dd9d38a9a13468275cb7f497012f29 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab01b3c9f45089e8ae106735a0308ce4d0ee9105 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:726de101cf53856234e7968ce22fdf88c7c60fb7ebb932b6a72816a15879e0a6 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cd29c557d43b243273bdd3ca472c2d6bc0b4a90 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aadc4e10094511c9effc77c95c50ce93c269349266697310c148c202b05e8895 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fa0158954dc5a95c5a4e171e0301b664ff0dc5a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c7673d59ccbb5091ec21800fecf48bf69b99d84457a459c89c93d0928d923a +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..9b149a6d013d0e6c434408d596de9c60411068e4 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fa4fc3fdc2dcfe11961f73c09c8bbc12170d988705db126e9d767976ce6abc1 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..702b90f537421f7a418fa7100d3de4b5d4c4ed94 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf558c1fbd5ceff986491c896ffa5d8250fe0be9d2eea7e2e1abb8a7ed85bbe +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..3579a65df68098ea24893eaa9111354891a0eb54 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc8f54700f00554627d69171b04d1e7cfd31a2a329fdb8f60ed35a50c271ce78 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce72654f572f2506f27160b816a295cb0b390c16 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a218931437f4ccf43b090350bb40ee3df136a61635dc16c5ca38673a829c2bdb +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2fc6342cedca0362a1507d8af6283e2ea27bc7c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c324177b50d7273c9ccc365b00d2b7acc8c28770d4c18d25a323f95b22aa230 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb502d805784412045160b0c30fd0f0fb106cd8d --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8153e2730b6d501d2e2b26f66460665b5590d76f6a8dbca3216f233f0a117462 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f919436ef034fb440eb879f0b19a52bc42e6f47e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b8fde2bff0afcce9b007af5d592f7c01528ae7096cfb072fb834d0a598e283 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..834053b0c05598c39fae210abf8291b9db67c2f7 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4292ffb33cd7d1b80ddc7c949d844a5bc1924a95e58a052b11d024cb3d1f5ded +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62d3ff5674f174fb6f3d750fc5376c6484ab9e8a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/global_step704/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4208b6cbc76742ba416924eaf6fdcc861809b1175966b303f8fb96221b70f6c9 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..a0ac01ed67f132df1feb2ffe56af6b922ceec7a6 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5907223fcfd4dfcd506af142c75bed7bc0cb187598f91e46edf77dbb6be78465 +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..bdac65e1c6b25ffd6bf27792db7d013ce61c05cd --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8285abe7684d6217c5642d8fa9d321152025bb0739b164e9337851dc953a4a3b +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fed940bed83776fee227b5936c168e6282b54594 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11998cc5f35748b7722fb0b2c7a077a4a3e3b00ac72b4ef20efa3259e7892c63 +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9d6a47432e1d286ed786e51f5fb2ccf4c34a1aaa --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e31d14b45279e04aa4f38284e0a05ab01a90eaad0de33cd1cf2634f7418b9f +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..974de3c96a2b49a47e1babfb7bae3d97f1933282 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:022e29e248df19c2f4db4c498d9e231c6d0174120f032699972b22d91448bf86 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a5fd89871e608ed541e2bf3ffd244e2636392fc --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0920a9f829010e738bfbb3f0a2e04bfd96273157e49024c6df22c2091a21c60f +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d9477e4ca5657a13657235254cd748d4834c97a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855f4ae8c5b9372c3295900233aa4dd3bf2f53ffb72d83c67af737335dc8e59e +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4deab20de9356b2210d58d2276016f67c341436e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf798145e2832cc8b4a33a705d54554fcc2eb807794523b7214320dab69a97e2 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f4b103549720845a27670e7840b9046e90d550f --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/global_step768/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d284fed69ad56f8dee4ac634a7b6928db93115bbb4cc1ca5b265fba052e3fee1 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..a6ff147ac52dd250e32c1555090ab4c04c4050f4 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8174f8c71c0b28cd2acbb4b2488dcb34fdf9a59f132817a2a5a83dcdc7b2e0ab +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d143d8042cb5df5225773f0fa14872306c2753b2 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb04f44650f7e9913e61599336a4cc4815ca528ed67cc278014b4a72e38c8693 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42c901891466cde9500028fe39074dae0935e941 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57df652c0d73f63af98f721c8f4b03784b7fcdc991ec83d6551539cedd1e42d1 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..135635caebc22acb4a78356d08d9b4636718f886 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4e8c4febdc7a143d8ea939c34aac58e710dfe33c023fb2fc8c91942d7d8a0d +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1184ad1b3e3b73abb1dc5fe1400cee4400d3ed94 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1e0ce4fe51c9b90380ddf35922ee448d399f2b5aaf83fd568441fc24a36ddd0 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0a03cfcfca15a4bdadf3ea501cd14e1ec270ff1 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4bee9022aef370853cbeb37d1c1a4fcd6ba68e07f7828f6dd5c19d172c5fb0c +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f04ad9e1194738888d103cb9665cf3724d662280 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/global_step832/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90a3fc8889841067cb4c62616a06be4ef8e06f8e88a6135b375a2b484896dbb6 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0dea0fd01a9c90c65be373b8252913bd88554674 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e2fa2b5d460f4aeb41d913783a0cb6667cfba750799e391897738c62429ce3b +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bca24bddbe57448285a066b4cb1c9606fd03bf06 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9b4323e4d405732f06245b1ae2350782d6806c1d674f65f8de1b3343af2366e +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcd27ac6fd04f9197a2a7c9344f78a928b33b963 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:482cc52567a8c06992bbe15e505adf15ef30e5a0ddab11d6f2838716e776b52a +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3daeaa46a622dce5ed80e194196f0e124fceb0ae --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76dc2afa05a52f854623dc4096e572093dadd1920aa5475207ec008847484734 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86c9665e78a8896b218db5f87a74c2933c4e56c3 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55ce9788669ee4207d0ca54f6fc22a33f5a8b5849a98c3cd07b243f6ac225887 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef8dc8d635ba46156fd1687837efbf1efd02025d --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/global_step896/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f236b983f1abdf512ccfec79a71a2084d982d286b0510351b7f012be084dce0d +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..58c52b06db935e0ed11b603fee383ceebdb11c22 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb403abbb622ab1f58e14aa7730003833674d4a741a7f302e1bb8fc0a517690 +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c279f841b3a5958418b2ba6775c3cdab09da9494 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1075449cbf204901ba9b3a3ad9eaa490442632e1150f5ca353966c8065b6da7 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f876aa45b5ba31141dd260c8a2d4e00fe346ce25 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22d6f06c62d5e163e6d1532e97221acd892b25ed9bd98bf8a8d62ff32f4e2fa8 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d9c44246b3a99cd9eee45ca9d4f3775abdcf5cf --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:756d63c3186e4c07179ce7a6439b836b8e9cd31646eaeb6ef0f7daccc9f8d1b1 +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a123c03e68734d8f115a1bfe580e691fe12d09aa --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a866cb0b89305c20a1805daa3ba1ae238cf1fb42270f9487a2cfae471eeab26f +size 55408837 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce9b39947fe617be6066150c320cb1528da4d8e3 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/global_step960/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:627b8f221c6fae27d81bb4a4af76763ce300b9823cfd5a7c2b4d15acaf09237c +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b97745a64064bf3413079707a918a741405394b7 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa332ee2a45205c4a43fc859acd27147409d77c3a48ec56ba15eeb94b25da87e +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-1024/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b97745a64064bf3413079707a918a741405394b7 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa332ee2a45205c4a43fc859acd27147409d77c3a48ec56ba15eeb94b25da87e +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a098c77cbfa94061851075e524c574579a620cf --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3027328c89c5f77c179c8977d5fa82049231f49cb6ad947623d4b6b7e667bc8 +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..799a249d4d1fabd9c649fc821c866987afc1ead7 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c95d4abe247f02a535198c798f7efd311cfe784c56703e7d893b68bd9f62fb7 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3e389e51619e5754d9df22503c422fd4a11a8be --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fbdc30b28e2d32d8cbbd49ad2d7dba4bb6dd4c0697fb827aa0235fe99165b4b +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87897fd1c5effed91226b0da87773542f0925ff7 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eec6d5caa1749e17b2a7990e28ec12824b9134da0dcd46dd702dea896bfd1b5 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bf87da189705590722de459d67e9372483d6789 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d391ca0e1ee902a87a6e51af73e157fd4684e7a92710c1b8f6ec3dc33891dccb +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-1024/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-128/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-128/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d10d8d5d1750f575ecbd47cdc8bb5a51aa1cf8a2 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-128/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c79a19bf2ba0f1e7bb03e42b2079f6a1924de264338d092c5cb6ae587254c2 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..686bce174bf93d03622adbc046639cc15126c0a4 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9119cc16d1b3ed76565d1df9f515ff7f3c2fc9e0512cd8ebe4502090c9ef7411 +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0db1c9960bcb895cfdcdf2f1ec0b9a1a0138aab6 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d40616b46ca37de28896c16e31eb2528fd774aabb5c952b3e7627bc3e3017f50 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..750a94f3acdeca19bff9ae2712e54294d878e18e --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:214797b84ca4ace0a375ed4a1bedd935d77f054dbe709223263663f5bf29f283 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a59e1a3a97aef8e68d8c26c4287663c41ffe63ca --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bda950eadc4f32ba2dada0048bf18856017075eaf7f59ca6ef331435767121a +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df37a298a6304ef22296c9b3f798ecfe5d67c437 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-128/global_step128/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f11885b11a755df83463c480d660c179e9568cf953ce89e7528f6106cfb8594a +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-128/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-128/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-128/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-192/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-192/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6f9d18a1b4892e3a7eb259391bd8dfa88b56572e --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-192/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c068e2c28f09aeac695ddee6ced258c5003781de3ba30d8b0496d1f07f95078 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0a689769aaa3ad2461a15264fb28197b3917c65 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0da82ddde07d7fc582ac6b449ac0b286b9ce14e0a0d0530a062665c7ee8c9fa +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efe6310c4f538b83d0f38481cf965212be037e7c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde0cc9d408057ecb6a65fc15b4fb4fa46d42b0ae75427c3b55913b1d3506d47 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57f86c36166049ee269b6deca8d40964c856068e --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e127b3491ba53e8b4aa53ac1c8944da5882982f42ba62071abf9dad742ca68c8 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3df0d452bc4ae52784cd70c48fd5be4fecb3e30d --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e79a93e6746d9f957608950f9ac2e4771f50dac0ab57133d67ab70b50ff5fd4 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88d1bd6a1ee16b908d1673094591f6f70e642db7 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-192/global_step192/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8fd50f11416c945c4c2947c65b0d0b62e1a82f96ec16db4caae317d1397db7 +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-192/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-192/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-192/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-256/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-256/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a94da784752ccc267578b8d9de384fc23eb99689 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-256/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40e6bfc152aac044550f7dc0afd8bb02a275dc0e7e8e0d58bd050d2b1f073ef2 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a07735723dfadf8f379e58d03c5e9d72d03f1b7c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fee17d12f4c18ad4d50f5c551ecd1211304dd65d1fb0595f2cd8f2afb309c37 +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aafad94512286f4baa7da7006d8e353cd32742b1 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aa6f28ef100e79b64a48a41d3a95a5c40a5cee2b088e6dc0f92a69f72d7bea2 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..824c24e9cda25b4e0efa65648bc040ddb2c88f7a --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d949a7cae8281308d2141365f152cedba3688f941a5597a860f8c01d1855c283 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6732bc75622f1c53f65b6a4e6cc3d952fcbe0b94 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc6aaf0d03cb92bc6b2361d11dbcf400f643cd1e3f95c01d65d50819b3c5d7c2 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebbe4405ab5aea03d1a5975127f44f5e90811eac --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-256/global_step256/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:905b42034807beed0621c2417f15e4934b2c39cd1828ee9c30e460da5788644b +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-256/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-256/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-256/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-320/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-320/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8094006dc49fc86054ba27dce09a8b3e3421c24f --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-320/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f2aac9436d2ce7a9c53b12cb5d10087a897eb7ffa9017465e2300f433d0b5a2 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a38b838695e97786f6f4a2b3aa161d7a08de7181 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa3b379913f973ca53d20d0b14a73c016e35083d9692c266fbdde99e13c264c +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8f67fb9ebc062df05117ad1352f63363eb5da5d --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13cf79441a50e63be97ee31f3978f699406223084e5790e565551154ffa74c11 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4eb0b8fd5bc7e0d26cf9b9c2e3ff65711bb944c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e64b708753b5e3e846b7183fa4d0c9cca555f47cac418e549b88aba09f80894 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a481fff2d2e6c1468ecc986eb70841f16ca3812 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:515aad4e96dfa0905cfba39c812444118fa7b8acb7f968fc45bb3cbdb609c7bf +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed9702dba4a1f674abecf03490efe6e168f204d --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-320/global_step320/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa9004b2f7c61887aaec5b04f14f248d82a4da4f370dc63dfbb64d4626e2f764 +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-320/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-320/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-320/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-384/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-384/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d6cb040d15e0450f2059a2f605f88ef61e51747 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-384/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e975b9be153d9dd1b9c09222e4cd91b2908589be7f4a81aad63e74a2fb3972b0 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dd504706c4c7ef578c2031446c991c7ff6a95d6 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f25ea8e9e17659b019ffffa33f35738978c0f6168f74183427633f2cb160220f +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6879740edc76b1a1202081025b574fc23e0a180a --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa0780724eb9a9c2b43c1c0ddb580766c2b827f98a5c67c7af6fa48f09bae741 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2160e2811b744157ca3631f675d428615169a941 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53c5223f9d47fa6565a96efb8cf15931f7d1cf433eb3ba229376211ec6560fc6 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f920be339d25d77ea606f66b3d8d763d3bd2c86 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd7931a7fb04ef5d12dc5c8b1ebfb1d672916e35de8b5b759030256a633adfdc +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6743a7964da137d72fc1d02f0975efb6a07d8423 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-384/global_step384/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c097fb81cb08a41affe1e7830cf8ad7881e1265de169d80c4a1871b18c79f938 +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-384/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-384/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-384/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-448/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-448/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..593b215d8476c658a0bdea45887ef05f6721327c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-448/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8238498f128eb856256189b949c0a4d19943d4583e12a047a30ff5c4b3fdea80 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e39b7d22aa3a9f19701e9db633daff6337dad999 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8c649c71c4498dbccc6aa2db0ed2fd906da2fff2a11aefa7e24447457d6fe6 +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3f9ab9fdfa8bdbfb581f6da211589e2585aaeac --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:535c02c13626c51bc74451d0c3c60c508d70a409474a5143acc931d98913c2ae +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e51dfcdec90ccdbd9891c9a5528a4173815496d --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10bd2b42371da1b3b39fb628f631cbb4e388c536a09a7cf6dce59e4eda4dbc2a +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40415ea56a60ff0e5f26f26c4c0fcc32e6ab328c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e9f28546383f017ef3a84be230fcf34520e84cbf00a26a4c9db3d345437c34c +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab3b06298bd99c82e9b3858d0437de66a9ba84e9 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-448/global_step448/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7889bf19e91bdf5402c9a891d544c9e4783308a48ad839f648f8c36ed00552a +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-448/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-448/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-448/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-512/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-512/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..84bfaf7b3e1995a31534d68ba922ac8a13c8e5a9 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-512/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a2c1e20c5752210740bd37036a6b63dd967aef344587d619bc9ab5f62c0f89e +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf971d5c29824cfa7daa39ddf4200bf06acc4a2 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:000f72d879055f03073deeefead47b5f93e4f757b186be1e6374e71d81578a53 +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d0fb7f66595c1c822063df355dc152d541c9c3f --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6930aceb9ba41aeea96e576e764704cd27ca4f649887feb6889d9cd5e682af46 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ae0f3228b100a3495ee79d4d34dd126562b191f --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dca117b34627e1c5c3e7080b9cf7ef7568b25ba714a23b2b046bc2a78a8fb67 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66ea20d18d47b9ccbede71a6a185f4bb2845c265 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47929a3f750a14625d3c303b272cb358eea7aa76b338413c8d0fc7a1c38a5455 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f52d7f5e9ff7bd070529b723b0ac709557d3c7af --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-512/global_step512/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd1266b2af104eff9db387b2d64fa1555e975daf3f2de8c647499475f3fd10da +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-512/rng_state_3.pth b/dapo_lora_r8_20251129_135342/checkpoint-512/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..40e9f6c539d58e519903b95e6c41e51eaf65126b --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-512/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85f362066d8aba5d721bdf9556c521eeff0b3d7fbd1dc8a79d1ca0070527c4d4 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-512/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-512/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-512/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-576/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f956437ee71e0ba542eb5d92b686edf055c1e0cf --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5815ad08551206bb582b7f1e0f826fc7c8e593fd4f474ea1a363b13f8c24542 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47f92c06bb14206d9e6c4038bd4341184eeabf18 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e09f75a3d7ab2e18c8d8f3bffb023b30e08de802b3c19fc6f4d29a17bbe9f884 +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fa426bb6ddd72d1a6dd4426700eff6e7f55dfb9 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a12a65bd975e11f21c07d12b820c8fdb4dcfb1471e60091959506e319af8610e +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..065ca64b7ec22a048d608efc17c0d5381c4422c2 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0171b8425deac96ab77e61374e9ab7f73d87743fa26c7708e4710d8d953407a4 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d50d1c87dee95d38f0847b782339784edd7d7979 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d23fb86a6e82f9fdb3ebd14f87063fcdca1b6545e729124cd6ba6081c3dd414 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05b76b847251665b800c5f5d1bf4e04e9c24ff8b --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/global_step576/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed1c621da5f7b3963f4cc2d82d60e52a601da9e0cae5246a51df3e8d20c0f0c4 +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/rng_state_0.pth b/dapo_lora_r8_20251129_135342/checkpoint-576/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d88b9cc18dd261a6d6b06d5e9c676a65d5da42c5 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc907c73dc42aa4b5ec9665b69b7958039ef4f6a86f1e52299dd13acf4b6d2a4 +size 15365 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/rng_state_1.pth b/dapo_lora_r8_20251129_135342/checkpoint-576/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..3d6b885788467ce279d45b9c003773b31e9e759a --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c1fc7011ddc5b764a1b6b1fa68d71578cd6a8c7eb65f7683ca3cc2455bc33fa +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/rng_state_3.pth b/dapo_lora_r8_20251129_135342/checkpoint-576/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5cf07f630067629822c93066c0215f418bed4d8 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c7cad50f84c70c4d46fc6a766b3ba637ed3a520c046b9ef62b8903fccb5841c +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/scheduler.pt b/dapo_lora_r8_20251129_135342/checkpoint-576/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..454813a4990df191f6951cdef743cc653ff31f83 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105f4404298e62d6811a76a80078eaf19c435d835ba8926a324f78dfdc9fb5f1 +size 1465 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-576/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-576/training_args.bin b/dapo_lora_r8_20251129_135342/checkpoint-576/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..489d1fc6a9879879650b9a0275141e44deaac832 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-576/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e591d12c15a6576f59af6858dbccfa77b59d60b21ef7a813c92a6711b9106af5 +size 8849 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-64/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc7641d6da2251890825027cb3bc3d9b29ccf647 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f8450fa5dcf918f239312150b53016d1349a231b08770ebf7152fc5e98b4da0 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00ba32ccce5527d7f07ab9ea9e0f3739c0df8bed --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8761b9ed5c52345619ba9c62a0cb382dab4ddb73e462493de379eb90a465434d +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ce0f6823d2eeed3aaee4d143e0f1c7964880ee4 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:205e8e4a948cc75200314fa5da7389edc41056533b3a327cc7a752ee5b8e1f22 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae8f79cbb10e7fd3090517cf35b699be148f2e9a --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86d3e4bfbaefa4db12d08546d0377d9c345a2a6b5d9085be5d499f48b5b60bc5 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1322349fedb223fcd37c92d87fcaa5eb4f8ed6d9 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526f506bcf3e7d6c00a04a11ccfe27a0ce20d8a4b0a06d1b62b17e8f998464c2 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8948d50e122b7901caa9ca89676e57169bfa63b --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/global_step64/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c946136a65abea60fcf1e2d92f23349ebb01cd25a24268cf9e37dd584a66b3c +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_0.pth b/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c43d7697fb63e1d3488c0dd291b6d6c903a4e152 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762298d02aee6b74ff75cdf10600bfc96cf6498a50016304ee7d41ad62c305cb +size 15365 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_1.pth b/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..d4ee225956b55c28c377b311804a79131ff43958 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:886405a183edff7d5f359707ab7228d841a76fe8772dfe3e702c1646b7a71a25 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_2.pth b/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..59d30ca903d22327264a8e8a2886adeeb8573b24 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72a16d74927539d62bea565fab7a894369f3001474d22bd01a9a69f07c82ed9c +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_3.pth b/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..77caa73e71e2aa17b6937c24f3897d0ea9f0c93d --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca954bba12fe215b1825ccecb1fef24989215987e29776babe596b506d6ce8a3 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/scheduler.pt b/dapo_lora_r8_20251129_135342/checkpoint-64/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f18e6fbca95d9546e2f67129f5c8f7ba7da9e16 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93cefd10607223128e502b13dda034a13939769cee1c2b5c47751dc1ef0425c6 +size 1465 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-64/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-64/training_args.bin b/dapo_lora_r8_20251129_135342/checkpoint-64/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..489d1fc6a9879879650b9a0275141e44deaac832 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-64/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e591d12c15a6576f59af6858dbccfa77b59d60b21ef7a813c92a6711b9106af5 +size 8849 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-640/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6fa526e276fd0b685f4395b0d222ac690ccea6ae --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:388bba101c1ac930bfbc5ddb88ced5405cfa80696281bb89e5692967cbb07fc1 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b103af8d20d831cae87a278dee5f5a145b6b9848 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b149c7a8f3cb1767ce6aec6bf7d8b4db7be041f530f5fd6e032792e2768e42f +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..026a46519326af0092364069dfe18265ff6f40a6 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99fc971799d38f632ec12762e5a5e8d0ff6b7ff03a30f71c17b5585257e259d5 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81ad7f61131161225edefc14208afdd9ae0b5fbf --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c20d581dda18946642db9e86c9df7e1ceddca6d9691e3e92e85c4a4e085f886 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecd73f5c7fb39bba2e345cd337961a23e2e1c8d4 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e44c2fcb416078aef621b24ad908a1d45af12460882e15efc9ebb0de755d5b8 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0edd7d1b96eb67a6d6c6078455d9d61bd880b74e --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/global_step640/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d5593e0e019662627d3f36a07e5630da199a142a6061eda2be90919d3ab55ae +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_0.pth b/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e1cbcc8ee5fb01a50439f47299ba46b429743ef3 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab80bf0f127992db7a0876cbc5340b22d8c1442c875c4385f77c4ff21216b7c8 +size 15365 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_1.pth b/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..42f1506f1e6ef0c835074d72ee8a61a93ec44e98 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec43dcf56ab16849078a17a3e8d669783c475ca99d79a9ae0bda01b68331c2c9 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_2.pth b/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..3b3a502fc1cbf34f609fefade9a97a816eb2cf57 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71169063121ece622c35397b500317501452326836ac1efd8766bd48a51e067 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_3.pth b/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..4d13ede87eb706d52f30d790927a8bb004272f81 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3819615a79d442e7a7448364a476a404ce0a8c6f3366e5f109bb026daed0b482 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/scheduler.pt b/dapo_lora_r8_20251129_135342/checkpoint-640/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce72654f572f2506f27160b816a295cb0b390c16 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a218931437f4ccf43b090350bb40ee3df136a61635dc16c5ca38673a829c2bdb +size 1465 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-640/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-640/training_args.bin b/dapo_lora_r8_20251129_135342/checkpoint-640/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..489d1fc6a9879879650b9a0275141e44deaac832 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-640/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e591d12c15a6576f59af6858dbccfa77b59d60b21ef7a813c92a6711b9106af5 +size 8849 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-704/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a117668e8a7b1fe2d9270d9b57fb426e55aa86f --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1d3e7f80e8c804d3ce8adf060f0d81ead87f80b3fef89aa904d9b947f707d0 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a860901c5948ca97f70e813d22de62c5c3b8122 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:730cdaa60d261f693b8915de137e0dff42d30c854fd2c8dcd6e8315200cad669 +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b04ea720d69ca33bda5573c0a108fa619a7a2058 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2909492cd5fefc14244f6d976c3ad77590f05807ac6886990e18c3def076183 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d71cb4eeb391c778f8039077d84a960fe5db778d --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a9a2b774a873a5db0bb3bd656770c3cadd768b72dee3c0bb5c31d2a962649a0 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9aa98a8a2413753ffee7204c6af247426297aae --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:339d7b937f7c60c46591d2ecde07e684b0f833f832c7aede43b04ab7448339f4 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce7f8533b4d46f970b8f9df222f37eca59579324 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/global_step704/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c04d3ae7880ff0a65c07ea67aa0d6c4e077ca68cab3521f9fc17fe4e0fc4549 +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_0.pth b/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..036199503d8fff5a06b1a7cf96549f9de917cd00 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0290b858f95e4cfbd49b1760323c8266ad4af6be2e3e9986fd4d2279d214d0a +size 15365 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_1.pth b/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..7484bd69463f70237665f343440a05ebbf3ac7a5 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd0cde94c8f01a092be35f4d1298583faf751c4ca167d3df36b43ec1f5a289bf +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_2.pth b/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..6828e4852601bea16d03ec72da55abd7051e9bfc --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dfcdab6b325ce98e5239abe5fc01d6161aca1626d66e4f1bcbed203b8a4cfc1 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_3.pth b/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..3c20b35cc84ca0ad7a236ed71bef21a46bcefd9f --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c728735b462a6f7d4e91e6757b5a38d58fe6580296a4c4cdf4d14e9196a9a10a +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/scheduler.pt b/dapo_lora_r8_20251129_135342/checkpoint-704/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fed940bed83776fee227b5936c168e6282b54594 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11998cc5f35748b7722fb0b2c7a077a4a3e3b00ac72b4ef20efa3259e7892c63 +size 1465 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-704/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-704/training_args.bin b/dapo_lora_r8_20251129_135342/checkpoint-704/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..489d1fc6a9879879650b9a0275141e44deaac832 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-704/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e591d12c15a6576f59af6858dbccfa77b59d60b21ef7a813c92a6711b9106af5 +size 8849 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-768/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5639f74eaa21eb34357759e7384a4653ee80eae4 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea63ce5e5f550629fb7eb150a21ee7ded1d8c6c4b197284b8a42f3c450311bed +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d24017e03017b9d2d77359deff2f6233b7fce4 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e53e6e1526f64a66ddac88186160128603201013cd364a89afe9d3c545638d +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9b291fa30c88cd1c828481cc4522f349e3ab075 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4609c4a1548637388f0d90cd2ff8b8c77abaf0ac07283fbe963040eca48df840 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd022710df0c6072b7667bc3489e9955a7ab1a81 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:970142ce6c3d91594fc4b99b108ab6054ff75bd9098741657912122645bdbdb3 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40947b8760f7715a90d14e6f23c823c2bb4712f0 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dea0eae1ab9d544c1a618d2cceebfc254633d62ee0954c90d7978c1da760277 +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_0.pth b/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..318b67fd6d0bbc4a9745d49808b3da325d530ccc --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:785c146129df3aa744c86d0e5b8737dc40f375ff6af22218885825bfc67f3348 +size 15365 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_1.pth b/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..822c4ccc5d82d869075f60823c1e0f03d0b6ceab --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2442cf692ca20b5cf060c05740efc256ec69c573a22b4ccb9d7fb66a0ad3b6a7 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_2.pth b/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..22a108abc6442c77200c4a20317163939ce0ba3b --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64fa342453499f4d7444315728a77c4043d53df7b6328a588c6abef871e5ab25 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_3.pth b/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..7cba13ab464923c1ff0999d35dc9007727de387d --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d906426f88ff0d43676840e656c0919de713065a4b5a24eafea2823bbdbd81 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/scheduler.pt b/dapo_lora_r8_20251129_135342/checkpoint-768/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba0371866ff4c56375788d8e6b6ac204eca2f3b8 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c26f336522cb69594b3952d10c9ee7899a17aa4a8eeeb9d1b384b971fa4c183 +size 1465 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-768/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/training_args.bin b/dapo_lora_r8_20251129_135342/checkpoint-768/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..489d1fc6a9879879650b9a0275141e44deaac832 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e591d12c15a6576f59af6858dbccfa77b59d60b21ef7a813c92a6711b9106af5 +size 8849 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-832/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a7ba85dabf6d6418ce2177b5c890158405d70ff4 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e75adb3d484c4cb34d31012960e179f2d8d304979092b71cdde2f4377a5af478 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9e71dc62f86c3283cb322d118a2d734a6553299 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73dfdcce07ec2c882181f686aa918da145c530c722de3f38063aaa3eb22133b3 +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef8308d98b03c47a84b27d7c1a9a28ef5451e3fb --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb0e225b42590f9837f59b0ed8c849832ca80f4ed66f0c389511827d5e5b696 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73fb54a455c6ae2aecdddeb6d822192c35f6b617 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e043928c80cd47e638cee28225cb5e8f5226ecb03978ddf248648b9558d200f3 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0d684a0161d44fc957f05ecd09506006184ea18 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a0bbfcdef1d316bc2a5ebe9327ac55ac365e4103a343f39bc5180f05ab2dd40 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60d9aded1c72e6a8c7b397b61d1033d4a4b715e4 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/global_step832/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa94e6ea5fe60ba78806fabdad2b0f67d074d526d93895c0ce67ac5214ecf3e +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_0.pth b/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..52d4fddce858697f8eef7172e013366f73b0e607 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:310aa282249799a2c8282d90adec6afacf73423e57b50443e26dd4bd147a6b88 +size 15365 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_1.pth b/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..9ca0de851e3630109144683c8ec5e2613574ccbe --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9816ba359f192c9629f2be68341f1feb1d77beb279ed471e4f6e35b4bc8c9e8 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_2.pth b/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f12bcd42e5607240c76e8e33fc6fa5cbe73c5b08 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c450145635f7ff1731b4d20a8b23259310180b92c3d1a5b0235f60f046299c85 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_3.pth b/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..975775f7337fb4a1c673e49c06921a1719c140e7 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6106d79eaad292758d9fe4b914a97e241b5e1fb975bbaedc88c4144d592b4ecd +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/scheduler.pt b/dapo_lora_r8_20251129_135342/checkpoint-832/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8718467d126ce6bdbd53d0dbdd54da4de1ff11bf --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d2ef8130fc98df19a3863a629f0a8a22986faed3b54d90a56462143208d671 +size 1465 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-832/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-832/training_args.bin b/dapo_lora_r8_20251129_135342/checkpoint-832/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..489d1fc6a9879879650b9a0275141e44deaac832 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-832/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e591d12c15a6576f59af6858dbccfa77b59d60b21ef7a813c92a6711b9106af5 +size 8849 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-896/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e14b5808c26a22e40a8c595925a1fb0b746edd0 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cfd073fd2a35813d0226919f729c277df538b97f4e4ad3738745c89957aa154 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a29da215b7b91fd046623319be273237be1ec20b --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7d2e16fa574b3807337c3f552d59241d70356c076d458e48db43d98931724f +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..484cae0ead851f865ef788f01a6295589c05ad2e --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bc42464903d422fbbe9d8acb17845319aba0c26cdddd0be5e6f1ed9293cbe52 +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3255117f167d90235659f1cf683846fc3918a4e9 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee7601ef640251a89864f6a9d056731822329e9e56e36dcb85f2be28f1a5ff1a +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_0.pth b/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..487b88f9523eb875039335c99371af24a8ec2243 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55207adae633e4d05fce8fb6f4235c2aa4962e559005ef50887275f566292ca0 +size 15365 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_1.pth b/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5a8426da4c620e91132cb3b5330ed91049863d3b --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de97e244313ea24877f957487d8e37178bace8350f901e0df56a4edf901252dc +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_2.pth b/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2bcaceef13b5723baeac90237ebb8a2e5119f86d --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fe25022cde496a7d34e21cea6b069d37379e01fd58350cdf68e418462228007 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_3.pth b/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b133aeca439c71f16dae5bad1dbd1efedb2d3d6c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485b3440b98f06b7cfd82f591979e582cb1dde6bb78fbd05e14341b536f61167 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/scheduler.pt b/dapo_lora_r8_20251129_135342/checkpoint-896/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b4ecb0ccba616e482f4a3ec4b8e0a53368e6fbf --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfb7bfa2c34c711580edf233de0f324b5ef962a780aa91f27b4eb576e2588ab +size 1465 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-896/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/training_args.bin b/dapo_lora_r8_20251129_135342/checkpoint-896/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..489d1fc6a9879879650b9a0275141e44deaac832 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e591d12c15a6576f59af6858dbccfa77b59d60b21ef7a813c92a6711b9106af5 +size 8849 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/adapter_model.safetensors b/dapo_lora_r8_20251129_135342/checkpoint-960/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f3a535e83575a0888132b717ccd47f1ae2e8c6c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c06e8979de4341dcb8236acc8d65a31de96e282206a6b3b425dddcfa1cda22 +size 18516456 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f6077da10916bc6980416f9967a7fd7f7729b86 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ba9d9c8e8bda8cd5c496f629b271ef598e1f73e79f34b6c6bd346e865e020a +size 27711621 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_0.pth b/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..fe7457cb26feba4aa022a1fd4b1f23be34a2619a --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2054b444b797aa73816f5a89883792cee9c874c6c458735ccf93b7fd6be9f346 +size 15365 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_1.pth b/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..4e812c0a95f0e53f7dfd87d4bff4863b1ebd07d3 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:745871eff0c03cab3ba0dc904120fcbe34438c744276579fb77f29fda3914a5e +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_2.pth b/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..097d44c87a5c8eec8aca3654cec1868af38fb33f --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf3f3a1db5da53cdcca5f20e392ffb5ba6e6bd449d468392ad2f15a606277d47 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_3.pth b/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..d78735832421f99a08cce4d61337b54197c99e10 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa68b117f6ee632cf22ecdeedbf6bc16725ab5e10f14a2e30e80e489039499f7 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/scheduler.pt b/dapo_lora_r8_20251129_135342/checkpoint-960/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eb04204506c94bd661dad83fc4b7f80d132d458 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0745cbdd2c0a3caae7131e38e031d01350e2e6b8404ec309e908eeec7592a96 +size 1465 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/tokenizer.json b/dapo_lora_r8_20251129_135342/checkpoint-960/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/training_args.bin b/dapo_lora_r8_20251129_135342/checkpoint-960/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..489d1fc6a9879879650b9a0275141e44deaac832 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e591d12c15a6576f59af6858dbccfa77b59d60b21ef7a813c92a6711b9106af5 +size 8849 diff --git a/dapo_lora_r8_20251129_135342/tokenizer.json b/dapo_lora_r8_20251129_135342/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r8_20251129_135342/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f34c8ef4d0aa2ce8c47bac9f99b76a19934e5634 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbfe97453bf8df1fb86ef2c56aac1703bd2d82caa84c45d672af199a08976a7d +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc91dc208d46a7022012989fe6cf9959b174dcb6 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a8e8a4b7f621ab5bb78fe9e503aaa1c44f20fa9c2baf463c22964d01ab68f06 +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad60faab9313be7e7e1ddb7b158e93300df75432 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64781bdb73275a2f7a1b4aa3e1a85be553ae4b99e8399b0f9c2275e817749b43 +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..9710775462c2ec5bc05a52d18cd8ad6bb4511fa7 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:266f5fc606d1722159b29672cfafa3adb5b37be9c4a64a8f7cdd818d464f99e6 +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..fa419edec9b1f96af405ffd5e1ce528fef149c74 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ce1f726f829bf7942861ed07e8096508f8a7b856b9777d3146a45c368a6c03 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f4ea67c1d464371c9008be63cad6bc0530b80c9 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8d13eb57a2bb9b2957bb5503c43f2a6918d6a8187ac0bac072445f4f5099c1e +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..0d246ab48fb3102d853bf6f27f5607a47a0fcea1 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71d8e8e15b57a2fefc871857da527d97231b4d0190adfa9192111c4e67005ae +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d91d84ee7ce6fc15f8af630d20f12aec7f58eb --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a000cffeb82f679c5eea33f850666a8c70d17499ffc7879cf41417a213f90c +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..622568408c6b898e0e1d6ff5becefb9885e5342b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a14b082217a1d0567c823616f5b72178356f8d444e34718a9e3ba4ce9203bc33 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d77adea8e4155089fa4d6f7698ab76a50e5b19fe --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9566740245ec2239f8f7f3cbe80d302d23d7e8bafbe2638378a36434c59b402 +size 74329221 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32c41b007c2b188592370e5e4d21902931cb1640 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d835f12e9ecce5236d4a0e0cdd776833ce4ef3c7fc9a8c07b7f8f3a8b6b8c6 +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dc9a0f5242b8057494c63365349154b3158e5f7 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a19b751b0fdc8d824b1e071884bbef1dc621e3244b32ff7e00445934e9f39a2 +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff3e57f3e1e7cbdb4930b2659c70cbf87b785c35 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/global_step128/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6354f0b2bd218a4a1b4e847d5c65bf4e5dfe3c1c447a479cea6a3862897ec826 +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..9b441d5a98dc2ab82bc18718ea6cf3c649ded943 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:383f1592630be99279617a72b374eaf646ce700f3caa5f4b916dd46ed3c81c46 +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..67ac0193519a65eabab31693c8028e2abe20c42f --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97e11b61b1180841e48c4e41ec4cdf0ed6a904fea61f4e949e8bffe096c990d9 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0b99b1837f3e46c84a9124126379fc0561439528 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2477003ed8e9c04ba3bf9d32167ac7fdb24bff48f3a61ab96fe43eb0efecbe1 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..10ef72c6ab7193e8e7e49b5feab0c86beab7379a --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25ff54afd9734456af0db367317f1dcc9a5930fd983a42f384352fffb3516a3 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d08ae64295b57090bbaa5d6676253533d838873 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a72d1751ecd37a23ecd20bd8b9260f394c2f370cb5db8d203bad7d01395f4fb8 +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8710dca29b549553b653bef913a89b225917897f --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73a912738983e0cfdeeb1a579951aed7c055bbb1bb933229b650b18f12dba9e1 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4d96b75db411c33d4c26b73236a39a40f8ffb8b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d814ccb87b36136ea4d404dc7d3e5c72845ea5a016311967c654c913abc76c29 +size 74329221 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc5bd70b064c56f01810480ceb6f822f4d656f84 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f635b9c4c8dc1ebee2494fe4efd475fb852fadf5859c3288f19643d70e58d39 +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b34aa8f7f9739045e52ccf3e71d0a8f6ff73465 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dc2a7026461488067a2bf4af325762aa80cea2f946eff7870346b0a6cb945b4 +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9ce86ea8ce1288b77f8a7a05d2a27d7858da36e --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c32489b1aae34ea6434cf2d3ee94337e91c8fbda8e58f17533d076e6511bfbd5 +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d874de8e1619eebacfda97745b504a1733f73460 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/global_step192/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca7ad5c09503408ea5d973608dbd12142c4ef25473e28450c74d06683a4211f8 +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..46728bb2caec794525e0985a0c0d0dcc246780bb --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c9dcd145aaed58792ca37c2f0b344a17557df72394eebddcf82f446f60c2376 +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..37820127599441d8ade7b2c15f68510a32299102 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fbdef72a2d5c7ee1dc2c3446cf01bd83fcfb34312b00c7205aed3fd04545d73 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..06ed340dfb49e4f16269dd6204175bd0b9cdf66a --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b4d34f8a56a9ae9f73f3de04850908b232799522983064bb8d09584c5377f0 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..794a922947b2b35335a79fefe24c63f1c5e995fa --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54a7951f210ee6f4771e17d615a8d03ccb16b36beb6c853533f8393df1589ee3 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb4e8900ca74d271df161df3e78c5e3163d3ca2c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac63e93328a0491bc31c5b67747712626467b0c1fab68bd8f3a90d2ffc2d318 +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f4c003fc8ffe65f8da47d326347413a27ac54f9c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ad8f34e10da2d78bc1307c2bbb7f2755a6f6e565a534bafca1b2b35535674b5 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c8201aee9586d99137388286f1dd4cc8ce41eee --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d063de85ce6f54401c0a4a857314e7f3317869e93451a83282ca38bd18eef2 +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28144d582baef5758151e0ec8b7124bf6d8b2a12 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/global_step256/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e619ca2405e4b1df089313634c4b12083b32ec08b5679aea07f1355c680078be +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..64df028d6bc4ea16b97c982af73c131b83cba64b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:501939aa197042b9d6c139b455de1fd37718169f130e7d243c863d622252bfae +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..d65a32a42f626c551a1f8bc7f941d7fbbfb3a8a6 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e565268765a546d48b8b032edcb4ac3b4886b441c888d7e402da44ddada1579 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..514dd182eba9fb5a6651d72ce2d9c7a93e697f83 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f53994bdabb93a0f181d5cb70d32b6670b7910d9e64decabb0ea6e210a5fa9c +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..e03f221a86e29b415639817456423bc20cd2ca99 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e7d2c57208aaa33622adee77513352c93914750c6961364accef4b5a80de83 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da175406e5951634027623c46687436be96a222 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8495f527d2ae384d255f961a1b604892e1f5459d17e99146a7b64167ecb9365 +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e44d88fbe0324da31a1bfdbf3f5daa0719980a90 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56e441e0b7c4d16ab65f38fe79b2ed05166dc471196450842823a3c80d03e78 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c175cd5c6a00e9b2e0988bf578f9eba8f87195e --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7759b34d8f7ed3a8d7d426fc1cab375104b16731ae8c948c7a1885a314100d6c +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95903218299c19f5db5b293a5d94c962d802934b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/global_step320/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2e9809cf74039bea5ea93331458b9ead49bd4d183aaa4b4ee5ad8882d2cba3 +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..8eacc08ab90adc5505df8cc336355365033c1fe2 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:121eff411f947a807dcfffcac51cebeb78e8842e7180ccd7cfd5144193238f7e +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..1a22c627bf3ba04fb242330087b69883b55a617f --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c9e3ed82ec69cf8bbd9cdfd0da60f74009fd4e5466397fa73790b86f2b1264 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..d551d0951d3e21c77472614842bb77e275e888d7 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974a08dd3b1ffc21fb0b9c323aaa932ed3e77a82964caa6e355975fc413bedc6 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..eececbeedddcf1f798fb1a58bb5794e43a108dc3 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d55161f24b7b367cf301f16407a2e52664cc01dcdfcc4e0d7f898785408c7f7 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b635ce1666c50e816d388484f117d6c351b92d3 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da013ae0b2b98d7666c2dc2fe7c1c09f26c72a818d58bd9b5b49a1d1f432bd5a +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f6e1e28f1902545c54d7057d27259071e4017e38 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32255f7718e5bcc01d503e9c285528cccd4fb5ee2590f98442990a6cefaeffd8 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d43d5f214ce016e9b65e977cf91230e35af8cb6f --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f5ea498b914c30ec6064ea0fafad5239d9a71955ae6e611c997de37a6ac1b0d +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e433225cf469a522e6ddb5ea2a4263fe23253eb4 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d2dfa2e4f1fabdac193f52771aa5066227608bb2580e4b897d975115b733f7b +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..457b97f775a58ebc799a506b82718b59f84fc8aa --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:987f7c5615596216d71e9f78fe6e37f63c75acaeb63faf3ddb71f2c1a3819090 +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3296d58d61c08e1916dbd5d8984e03b924f46d42 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/global_step384/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a469d71cce863d763763a080db0632442435ca89376f966d8cefd23872325307 +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d573f5772777cb30aa04bd58e21ca2c7c09f2f52 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7d29abb0c55c83e0b5550542d7a76f096cf49a8926971e527e4af02247ca0eb +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee9cc4403233cf9358adac144e98cc19a865c72a --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64e7d628f4a2d1da57e1c3b581a61fa546fe49c91264542897e7597f8d5794ce +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..06e97c508a6bfca76afd7ffcd2d74b6b5e5304f5 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6590fdd7a669fc405a67b4abee39cf86aad9ad91450134d13c1c32c72dd07a2 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..edb5cc0f21d0bf14500241658831338fa5505c58 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d388f363d829ca018f3bfef9c6a865ace91f76cd8e30a5960c041d2d194f9e72 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35447364346dd4e48ff2912c9630fa0d550dd81 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a73b3132edc693a316dd18b0560b36c0fb0501d1030453a31a1309122a6bf7c +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df2a44d534f47e6fb3cde17210a1b9fcbba8db36 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed123d3def52aaae596a1c4044aff4647302389db979310e86c5b39e3b98eb5 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a1bf54e3300874ae6dfa999af3b32b08e4d3da1 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e85a6a28d4b782c4cf6fcc6df1a8679a458036c96c68faceb43095c83057186 +size 74329285 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ec3296760b15262c30b43c72eacfd09091d476b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/global_step448/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e2155152bb0988e7bd0ed183993ee741aef69abaa1bee755c2392ffa14527fe +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..a1af6a7a2facbf2f2fe6b135fecb148addadfef7 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c61415ba2bb7e7fe0fe1af8567d18f758811f9177c39441a1e7812907b05e484 +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..e47efefc778c0cfa13c88a1ae33de13941777058 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfcc30d7b2e13a406177162ea8314144e2acb3d4cf9facfb15ec77e8436ac49d +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a5fab818a8afa83a462d6db9b3c92a5c4fb28d12 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2b37d507d0d4cdae14eaf4722242af723624388162f6981c17accaf8527935 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..fe7d604cc5e43894ebde8e3265edf04575824df4 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7eee740facd5e269cc8c9c923aa86fb2e064d55d5d214fe442998f4601ab57 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a39d5aae7a5de28bbf7c8e26531da9f7f0cda3e --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d50e6c2130ded251cbd3fb239e3a2e1e0564766292c69bfb4aa6ba0d973844 +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8c62bf3fc19a4d567a263ae1422b266591380c7f --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b33bd05711c7ecac8a829b33411623ee40d18a8651e605dce688e8ac9803e7d +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c92730f0fbe91ea7164f1e7dd94af49728b8e2ab --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/global_step512/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9196e5c0b92a4c3b3c9dda63873945cc740e7fc4b2f8eebb2608738c64b91762 +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..7065a4ecd08b3697c26831c4012af863a7a80413 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899ad682a33c43d6a28e156c57ac7241d896f44e7667fa98bbb1b249a03a7ac8 +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..c6bfb4d3f4993d718def2370dc4f4a4bcfa42317 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bbccea25a877e52cb2d0984e023495916d0857caa2a5e37429fd0d4b769fccd +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2dba46acd99e1e31645f41c86b90b8114ed3091e --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e69a53c9d4ce0bdee9024386f91c0df2dd2806ec88a4b4703aa3add588fd4da +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..51601b5906f149ace30358f8c38cad626f4d508c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4c50e7a635eef449c92a4aaad86b5fd953852eb567a27dd0573ef97d024e073 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..4800a9e5803399b265ffcab0af9c3fe980dbd948 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0e61c4f166edd4bd232bd6fbefe6d67a5b7e00cb803d1741eac9a6d2b7b6ee +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..885532253bf709561f47471483e743492eb5fa43 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eba1f49cb355c5b76c467916147bd4db7856aed3fc60ab337b12af25de8b47b +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bbec8bd429fd458ad23ea4941782a0faec7558c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/global_step576/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4930449ba119bd3f3d8a5088adcfe73abe4e7cf1225dadfba6ac719e1a848610 +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d3471d93f2741f4bc311e5b23ed2bd98a604c60 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5071846bd9a2fe9c9d4d401a9f3e5fb7b0d294d7dc9b9bd79bdb3818fa836039 +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6234308e30b82bf33859a60b3e6753460939c7f --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:848847613d0542e9f24a537e0aa298756e95235a594f98ad867c83fccd5ec366 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..7e8f4de1e41f67ce41dbcc0df1eba68aaa371d5a --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e448b9c4c0f22255ed3797668e14348ffcf65f1703d53e1ab719cd01fe0a75e7 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..d9a26f290f39b3a349f9f07e50f495839ae2a59d --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98c7fda3df7709b0dbaf942a3070b9151ce7d8b2134b7c8538f456f7efc9b00 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..454813a4990df191f6951cdef743cc653ff31f83 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105f4404298e62d6811a76a80078eaf19c435d835ba8926a324f78dfdc9fb5f1 +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..536f292bd7e640d1bdfab61eab0177d6877188da --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bc23530a80f81a0fba7c9a3ba5536fcff1d01970faeb216414f0ca1672f6c62 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fc99d4b80362d30f7ffaeba80fde194c65e3ceb --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/global_step64/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2f4137fddfd17b8d8700a8e87033e6877044f96e6f4fa3c8b12a16aa810c5e6 +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..8f93437084b3392a8201c4de52d7f0d34b77acf2 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d748747ec398fda132bbbc0b3be47d737fa34f2fcfbb0897ee27ecad247bde39 +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc8e2eb51f359d3078d1f1f46ffa08931cbcf1d0 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f46388640d7bc8c57ef2a4640e351453cedf50ac983ff663170ac2ad48c8a169 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c58b5ee095779ce05069f546cf89e10f278c4726 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f5f195decb7b597d40f99f1a72becfbe1346f0017b90531b170fd792110d99c +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..37f49cf84edb349b6b7e05821640630a7e600080 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087a8abb310f72ac8c7904ff3f6427c20a388fd9db0eb4a4acc883d3f093799c +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f18e6fbca95d9546e2f67129f5c8f7ba7da9e16 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93cefd10607223128e502b13dda034a13939769cee1c2b5c47751dc1ef0425c6 +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9d556c7492b1e2d8cae257d5ee1648485fc4e41a --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c3916295d52932f2000ed4f6b6f3f5950f18e4ef582576569a62dde697a70b6 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a423a3085656db4397a4488b4f8779b3a379100 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/global_step640/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c976e0ea9c037da4e895de05780673f8f583329d15ed7946c1494712c8e85d8 +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..314d099a6c86e60e30b7e2a7332865bc96f106bd --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ecc8a3bcee47352db0e7786519770d8f56e9c7136a5e6ae232a4c9eddf3281d +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..9c2a6d63a09f4ae489e12b2a79f6dd3208e38110 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3867253331fca83bb9ff45961c29c838117f77bce5b6b3ac7ddff1a4d3549e0 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..e0dad4b861e28713ce7ea60e9cc79317f9af52ff --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd0f786ef173b303cd0ca19e2067a1917b6a01aa313a495eb9aa94e98ac4905c +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad9675de360858abdc21b3cbe4fd573c7d8d1bd9 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe706cc5d6d406aafc213a1ef3160f37431b2c9e290df00c92645f6d6e76740 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce72654f572f2506f27160b816a295cb0b390c16 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a218931437f4ccf43b090350bb40ee3df136a61635dc16c5ca38673a829c2bdb +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7d70caa93b3c27998f70d350793eee5f25629cbd --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d14d91451c5bb7fe51604e8517303a30b81ae3aa6a777fe57d0fd596b8d746e4 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95af9f7900185b9e64015c383c622668da5a1cff --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/global_step704/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80369e0047f53e1d4fb07e10f23b843141168e5abc304796c3675b459f4f536 +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..bfdb9c7a70cdee0f7eadb12c07b63d4d2df0aa5d --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fee3cd382d8ef2e97c08f2ca4b193ab299dd563c66b48e1546fca47e80b59352 +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..444bd2d547afcf2cff7905a2d16ddd338884feda --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0e96b1c10ef2671fe130d2907a0bfbf15710d40c03393c6f51c92755fa1edbd +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c889a9e17e973c0e1ee96ed73ba10c2815be8380 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d67cba4ff34c07977d8ba1b7b1d95743860628e1684817adcb31d643eea6c80 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..8ed5376ec2c059aa1e54ba2c1a6ae90a9686364b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f54247fdbc4685d69f284ae661b7531ca9e308d02e15afef05b8a7f3fd049197 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fed940bed83776fee227b5936c168e6282b54594 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11998cc5f35748b7722fb0b2c7a077a4a3e3b00ac72b4ef20efa3259e7892c63 +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..06d437291c71c64cf6ac78e7ecb3e86406424a2a --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:002f2611968692e3d5e6a349b6af003811d3f4704679a5e74a4fa24d4c10de4a +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..77d1a271c95ee69d9debd8b27d5bf057bfc4d799 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1237c5435098aaecc8f6895e7dce518b3d29b53badb7667153d839057287895d +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..2c36924e07a8e74f86096af00cb5d20bda61f4c3 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1fbdae1ff9d086ad954fc4a42ebf1839a2363ba48f4633f4440e7f3aa9afbf5 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..21b6cc1a649dff381b070ad3a2bde3cacbe2e425 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5611d6d3e74b8e8618bbf874025b7aaab1fd1334013746d683e5c18a0d0a661a +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf446e9f6d72bf26db589e838e947a17514b35ac --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e8925fb8e2c5dfec02ecac085b3308cbe265d693c63c595d7b9fd98f890a65 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba0371866ff4c56375788d8e6b6ac204eca2f3b8 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c26f336522cb69594b3952d10c9ee7899a17aa4a8eeeb9d1b384b971fa4c183 +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a9578f56036d18a2b3f98de78887ba63477373e2 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c7959a5f477a30cc71edb3ff3703b096a2529978c683465404e410256825466 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..fb9cb6b57739c0247415a40cf2e34a7d619cf246 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5fb350c7e9334c6ea9e1c3258013a4274330d6be0f529db26c6e22a008f0450 +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..4b8f9a507d6a13fc3962350e6aa55afb9efbfd16 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d65e20a65ab11f549aa65873ac0ababfe66d20a9fcd83ec807000b36b03b591 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..85b8c7827b150120f3f0b3099ca46e6c3d7ddea4 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:814212514fa074c0fa4fb1bb079cbd1892216529fa6c4d3a38ea64bc643e1fb4 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..61ba8e17f18120606b3dbb94902a61c27c32617d --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fac9b5c5f54f8fcfd099bdd0b0030a8a7890f4e50d3648b7463dbcd8293b4b96 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8718467d126ce6bdbd53d0dbdd54da4de1ff11bf --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d2ef8130fc98df19a3863a629f0a8a22986faed3b54d90a56462143208d671 +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3f011e8131a2e90779066319462750b4922c7c7b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:044554ccfcd531b282f85c9b900e32624b8b5ef72a5e70f0a3acda4caceb8694 +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..5a4a93d5dc1b1426eedfeedbe92f5fbf101ddea7 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2b2eca776509a1ddd2071be8d5ed145c4105f1b2652bf329c32941f9e8bf642 +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..74da6151babb23a05cc3605ecade737576107e0a --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab7d3bb1d873ec80b3719fe248f92dcd3cd5618bb0950c5678dc84718dfb2f5c +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..e081d26b1a7cdc444ff129cb1abc633f9ccc8d1b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e57e911d37bbabc5be3e223c484cd1093fed69b92722aa523700c61f30867868 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b6ab4bd9c5c4fe8b73a4713bd01b5d4b1a5f450b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8475c4f2af107b33701d1074f66608a1811ea44d9db1c04d221c69182e36cb57 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b4ecb0ccba616e482f4a3ec4b8e0a53368e6fbf --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfb7bfa2c34c711580edf233de0f324b5ef962a780aa91f27b4eb576e2588ab +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1af90df55251011fdfd83af020cd5d5ef8e65286 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1d1748236e23f20cea6b6b188f6ef0bc068576018c625c1ba5f49753d2c450b +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_0.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..95c55d230091d3c469d6b92a2e6a451eaa64ca89 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62ee796bb806a9b3aeba4284675c47887b249a3f525c95860d34ac90f23618ec +size 15365 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_2.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..cbd07a0c0fe18d4c685355bba9dedd19a1354d8b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eac3f1be31120ff69c6651e8c0121a7f5170c83455d38c45d573a0cabb50098d +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_3.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..f9731cf808cba6a13f257d8786723950ef0b14ee --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b77ad1651ad09f6a33218e7cd557b77627064230439d1c3b20451e9fcc3ae0d +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-1024/adapter_model.safetensors b/dapo_miss_openmath_20251129_124147/checkpoint-1024/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69c0673620e32c6fc4bfa5cdf7a315d568784d03 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-1024/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:991ef4b722675ae8be8e5833f96dcb3d9421737584f7a872440e7996bfca90cc +size 36981856 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-1024/tokenizer.json b/dapo_miss_openmath_20251129_124147/checkpoint-1024/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-1024/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-128/tokenizer.json b/dapo_miss_openmath_20251129_124147/checkpoint-128/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-128/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-192/tokenizer.json b/dapo_miss_openmath_20251129_124147/checkpoint-192/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-192/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-256/global_step256/mp_rank_00_model_states.pt b/dapo_miss_openmath_20251129_124147/checkpoint-256/global_step256/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea0b05515a6de090e8acddc76e7fe61992cd5f1a --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-256/global_step256/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7889a3e8d910baa2e0c4ba24aaf409e6b99c555359ebc4df74b9259b03cac4df +size 503979621 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_0.pth b/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf8d72b79a159f6310f06a25626c9dd335dc8bb3 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35f93ead41d4ef62221e0c009f14e5d83e499b15b3879beb949f8dffabd96557 +size 15365 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_1.pth b/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..013eb5a0e4e7355598eeceab46533a3a8e2a4e14 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4da38ef05cdba29c3abc75c0bccac0cf7b78cc2c28af989b292fe8a713b4583 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_3.pth b/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c0da0606c2b648bd62efd76d254fc369a1abb82 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c574d50a5ea08ea67e257c54b9069696c710c330918ef4ea347f9be4dd42536 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-256/tokenizer.json b/dapo_miss_openmath_20251129_124147/checkpoint-256/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-256/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-256/training_args.bin b/dapo_miss_openmath_20251129_124147/checkpoint-256/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..4aaf77970b3dff8064090e296d624d3538978ae9 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-256/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5c215d84703cfc98ad11de2d9f07cdf4b5dc3343d7447f227ef9ac39f64c06 +size 8849 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_0.pth b/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d77a53f83a6214858335f74b02cf9ab5d5ac7632 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:240edc12d7493f39db7b3b16a2b016aed8fb44e8502540fbd641bbef8e5069b0 +size 15365 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_1.pth b/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..f0d3fdbcad2d095e54e34e3d60f3f7a3abff64d9 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12284711c61455d590f69da9914e94bfa549a1dd25aab48ff88bf1871a53ede5 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_2.pth b/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f13c11775a3084d1e62b086db0fd81dc2e194b56 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d79769d75139aac2abc4ae83204d598b48635cfd83c99d85281e3c22450cf06 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_3.pth b/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..028b864fc5e00f3c548030044ce083b716f2d2eb --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-320/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48184016d5ef1377bcc266a31d7cb60418a3ae682a24b7b1ff87b3ec33621098 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-320/scheduler.pt b/dapo_miss_openmath_20251129_124147/checkpoint-320/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b635ce1666c50e816d388484f117d6c351b92d3 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-320/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da013ae0b2b98d7666c2dc2fe7c1c09f26c72a818d58bd9b5b49a1d1f432bd5a +size 1465 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-320/training_args.bin b/dapo_miss_openmath_20251129_124147/checkpoint-320/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..4aaf77970b3dff8064090e296d624d3538978ae9 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-320/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5c215d84703cfc98ad11de2d9f07cdf4b5dc3343d7447f227ef9ac39f64c06 +size 8849 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-384/global_step384/mp_rank_00_model_states.pt b/dapo_miss_openmath_20251129_124147/checkpoint-384/global_step384/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fabb364333488ac8b1fb0703470154216b5870a --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-384/global_step384/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa1f33ea0713dfb9747e8afc5e84a80584e5dab923d444e768fd7f5b1edcf0aa +size 503979621 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_0.pth b/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..8e419235343a21fb399181bb3d24f89e7c398f03 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f61e755db934fee40336e46d34a606cd01a87c5d1f5ad3d340c13a512510ac2 +size 15365 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_1.pth b/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..6f3a9f875cce5f7d9029f1bd10e5d2a08c58af7b --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1b904d0cfa007a2eb464836a89608da43fcb365108dbfb1606eb5cc0fc8e7f +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_2.pth b/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0d0cb2a040647d3ec62c9c92aabe8f81f2f8beda --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1466478ba2cfbbd4fca78455edb282d8e8ad2dce9fb669364af89145aeb14e46 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_3.pth b/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..17ed8e30c26c76e9f571fb5a3676d94a309a2aea --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-384/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22a94909157da27243e314c756de79aa42c3d9639b0accceb46e7651c77c6076 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-384/scheduler.pt b/dapo_miss_openmath_20251129_124147/checkpoint-384/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35447364346dd4e48ff2912c9630fa0d550dd81 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-384/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a73b3132edc693a316dd18b0560b36c0fb0501d1030453a31a1309122a6bf7c +size 1465 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-384/training_args.bin b/dapo_miss_openmath_20251129_124147/checkpoint-384/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..4aaf77970b3dff8064090e296d624d3538978ae9 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-384/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5c215d84703cfc98ad11de2d9f07cdf4b5dc3343d7447f227ef9ac39f64c06 +size 8849 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-448/rng_state_0.pth b/dapo_miss_openmath_20251129_124147/checkpoint-448/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..122627ad9a31b5f86dd1297c3af0a5d13ed3091b --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-448/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75cc4b7c465aa9e465fbb5ba70f9a00235cd191d667ea38e78725791e19d1dda +size 15365 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-448/rng_state_3.pth b/dapo_miss_openmath_20251129_124147/checkpoint-448/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..eee5c6c08b3e154f1240bf18eac9cc630e7c5f24 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-448/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:185b7ed4b531a95aba13ce2e892bf611224ecd41b70e1223b6352e8c490570d7 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-640/global_step640/mp_rank_00_model_states.pt b/dapo_miss_openmath_20251129_124147/checkpoint-640/global_step640/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f27cf1a6f08415a4a9b089aa8985e5c0ae2a586f --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-640/global_step640/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1f648f55140b171a35b0582ae0521bfc4a54b3a11661313ba64395101237d3c +size 503979621 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-832/global_step832/mp_rank_00_model_states.pt b/dapo_miss_openmath_20251129_124147/checkpoint-832/global_step832/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1b5d9446d32b1ab8eee4f0b3dc1139b8fcd3cd8 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-832/global_step832/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963e8156dafe709695fec7b0e1c0ec30224f0af7f9730c79e688fe4576c1878d +size 503979621 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-896/global_step896/mp_rank_00_model_states.pt b/dapo_miss_openmath_20251129_124147/checkpoint-896/global_step896/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..441be3bf6ef939a296dc6dbc172033f1685463d2 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-896/global_step896/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e956bcdd999c84cfabb5d366eaa0004f8ff1be89868fe6024c96eb2ce4c698 +size 503979621 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f17ce9e59d648413328320ae4b1cc6de67800060 --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e8e4cd192dac47bffdd7c07297813b215af4dcd37960b640658f6e6818c294 +size 9639365 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cffa438f1193167ce3cc6f9961dff852ad47351 --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b4e42cc82581211da92ecaf9133f22d54386e12b31e9bacc0b672e03e83f15d +size 9639365 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47d9d4bb4919c9faa8f46eb4de287184c6ab7121 --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94c59dfbdc28ea05486df8bbff1cc5c1e872b66fd29afc47bd8e18bebbc2d397 +size 9639365 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed4259da9801a5f562373f864122f203abc29d1f --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23dd2e7b02dae082254e158a182e657a97cd58a630881345f10cbef5437cf3f9 +size 9639365 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3cfcf1e5a702ba8d68fe2cd257341d442c9a12e --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed068bbee67de4cc55d0816174a02a03fd0ff4cddde4c4260a9f48f99744200 +size 9639365 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1c148764262d73b160cd7cf2d21279a3ae85faf --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b55ce858421cc705bc7a94ca97fbbbd77b400ab8651ec74df312488f7e7464d +size 9639365 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/tokenizer.json b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c05b87e5370add782603852001588246f6053d7c --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bd5a140cf6ada4221351f3062098244415e35985281db3bbdeb240b2a5800e2 +size 9639365 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d9125a4c8d7b67d34cce2edcd6511e4ed200045 --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f3357a219dfaf1dd94e0bad288327802c334de2dfb9c0741fee63b73381a4bb +size 9639365 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c587c154a6f7197f41146f7f9b2d7843bbde6d23 --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b9f4651f66fe1b951ac2f1e8980d80c2005c976e4dab6ee82512dd6bb6890f +size 9639365 diff --git a/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/tokenizer.json b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_miss_qwen_1_5b/checkpoint-704/adapter_model.safetensors b/dapo_miss_qwen_1_5b/checkpoint-704/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..168c33d47bdeb46eb1e50b02c81208574d26b6e8 --- /dev/null +++ b/dapo_miss_qwen_1_5b/checkpoint-704/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a53890bf561bc59ac16af1d7ee75dab0e78dc5516d65e41a7153288150608ca +size 6429840 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/rng_state_1.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..53ff049360f4a6aa87233d505ea52895fe62613d --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:372d5b456046982276bafc61a93746f11712c7f6b3c057fa0f6617e00cb0baa6 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/rng_state_2.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..aeb8c41af19ac5c3ddcff206f8791bc080285c4e --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfc39f580dce07e3b16254f7881d9158d69149a4af0c7844e53e87b45a6eb80 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/rng_state_3.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..cc89a3d8f233556b43085073a9699778857b43c2 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27285e3d74c329c92babab7c27a3b8e3fe250d867ac3f9379293d87b53dfa959 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/scheduler.pt b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d08ae64295b57090bbaa5d6676253533d838873 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-128/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a72d1751ecd37a23ecd20bd8b9260f394c2f370cb5db8d203bad7d01395f4fb8 +size 1465 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/rng_state_0.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c988580f69ad70d1cd31014df8d0f8cf94f0135c --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96f18dcc89bb758f0e3afcda4d10abcf0d3388d2a05a71dfd04cc9a9138f0561 +size 15365 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/rng_state_1.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..7030e142c6ff3e33664f137d9bd3d416d3c74685 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad2f111b1f6c656455a17b609352106e8faa4604818d46034f570b66ed0fc67 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/rng_state_2.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..d29667b8a742c48bcf4f9735ebf060a833ff29b4 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f53882efbb453a30612f370ce1a891047d7f5a1d80929bdc1b948ab36cf8483 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/scheduler.pt b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb4e8900ca74d271df161df3e78c5e3163d3ca2c --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac63e93328a0491bc31c5b67747712626467b0c1fab68bd8f3a90d2ffc2d318 +size 1465 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/training_args.bin b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..92ac30421683b0459d8eeecb3918cb3673f85818 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-192/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b3c5daaaf9864e2e038330c84861763b6ffc86d92b23f4c6e5428fc51e6cca +size 8849 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_0.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..4b82e9a3ee5a8d61f460b9edb35e1e4c9eeeca44 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6404467ba9860054b25938e1bb7187c9a7fa9191fffd7ba6302fd35b71818f7e +size 15365 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_1.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5c7d7464bf4c6babd92ef09b9cd34661660490b8 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba4098d17a968e6bf5c5f35d7b31d3190bdcd314afc34ed003989248023ab2a +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_2.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c10f3eb242830eebd9a7adcfefe9915721fefd6 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abaf94e919387a2467131f0ef003fed1fce0cb573d1f27191686c0ca58b9a176 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_3.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..1b4c89fa6505ba720f7a496e48abac4ff6676aae --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3a2236756222afbe1dea0464ff22807785c9a085ee8bedb9ccdc784be273f5c +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/scheduler.pt b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da175406e5951634027623c46687436be96a222 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8495f527d2ae384d255f961a1b604892e1f5459d17e99146a7b64167ecb9365 +size 1465 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/training_args.bin b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..92ac30421683b0459d8eeecb3918cb3673f85818 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-256/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b3c5daaaf9864e2e038330c84861763b6ffc86d92b23f4c6e5428fc51e6cca +size 8849 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_0.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..49eab54f0bc5cbf4387d3bc2ec3c47076111b74a --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a452770aa4303e629f1cbb5b4fea131553acdbf3508ba5a9f9cd4b7cbada148e +size 15365 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_1.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..cd143585c35992c37d42324cda77e297aa9e2f85 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:432fba88a6a29ccc5812350abba1008c26fb5f1965ce499123f65dbcb5d99d16 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_2.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc3c30251af31f07923400c665be67361d7a277c --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c888a96defc202a0822d13e2fc75c7d544f2374791cc71124220c91408764f4 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_3.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..db9c1858c2831f02361574ea185a59efd64ba1c4 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c8b9bee0fea20d9184fa22665d3e761693d2465a1e861e47ca55206b14beb6 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/scheduler.pt b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b635ce1666c50e816d388484f117d6c351b92d3 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da013ae0b2b98d7666c2dc2fe7c1c09f26c72a818d58bd9b5b49a1d1f432bd5a +size 1465 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/training_args.bin b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..92ac30421683b0459d8eeecb3918cb3673f85818 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-320/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b3c5daaaf9864e2e038330c84861763b6ffc86d92b23f4c6e5428fc51e6cca +size 8849 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_0.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..ab7d2afdee98a552e3472279a58d83c11cf7421f --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcd67e15cd7ff45d7d4ee68c8959ed0ce167fedc2a3f9097cf08d113b114627e +size 15365 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_1.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..a1a216f178bf0bfebd2a891d48e8b5f0ef7403c5 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80161a8bd85ace03339215bc7ffb23ed2e4b47e625e29c750d8db13ad9f12494 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_2.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..13f9819ab0119a57843840121cd0dc89ef6ead59 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7bcef20f6f1d8141c99208ae8a7cd4dda3c4de422d8a1a293b76cbd15a8808d +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_3.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..fa873be3900ba63be2a102500ec079cf47ca02a8 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e5c947e1b8dfe390f5ef77030e4e90e82e648791ba0f01d2630f47c4f8671d +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/scheduler.pt b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35447364346dd4e48ff2912c9630fa0d550dd81 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a73b3132edc693a316dd18b0560b36c0fb0501d1030453a31a1309122a6bf7c +size 1465 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/training_args.bin b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..92ac30421683b0459d8eeecb3918cb3673f85818 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-384/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b3c5daaaf9864e2e038330c84861763b6ffc86d92b23f4c6e5428fc51e6cca +size 8849 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_0.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..a020061d2fcd8ebe763986580f2af8824f02c210 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e0207c33e158dedfc218ab734aaeb46f9fb54b63f134ee00f7348a184300b5a +size 15365 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_1.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..2fd01270a1f55ff7c6a776e6ac3ca96c487747ce --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9271dd4580b2d325e23db5e5503d54b31d3503778c89d5f065567e308f5959d +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_2.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..98d7fcb2a8c125e7d223449e6092c20a90a93ff6 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27a6903fb341b3d4b77f576f6f653783ec26c7998faa5e81d3e2a5e904d03c7 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_3.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..5616877b02df0f4e67b95bbc00e660f1c8cc13e3 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf7c61f5575c260d460edb4844b7bc9d03f66e77e3622f559e4b9216f275292 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/scheduler.pt b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a39d5aae7a5de28bbf7c8e26531da9f7f0cda3e --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d50e6c2130ded251cbd3fb239e3a2e1e0564766292c69bfb4aa6ba0d973844 +size 1465 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/training_args.bin b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..92ac30421683b0459d8eeecb3918cb3673f85818 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-448/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b3c5daaaf9864e2e038330c84861763b6ffc86d92b23f4c6e5428fc51e6cca +size 8849 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_0.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..535e1c4a645bb3d73e32829f34f7d4573aad49fb --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5383acbbc156a1c04640d851833dd66b705a12721ea6b0b666c32946be449138 +size 15365 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_1.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..255c1e2e9238661650d87c7d4302fb14fce55b31 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83bbd0cadf8f1e0202c5296585a3a1faa07ed2c6c5d5530232df141ae5bcfed7 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_2.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..672f9a5916260ac3afeb0218efc22155af7bc42c --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd8c675ce26db075422de140a5e27cae2b2fdd777f6486151d23e1dcb5efdd30 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_3.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..bce3b21396802ef4792e68fdb06530010c9a289d --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba8888ea8774c43cf4dcd8a11e850cd6f402417fbfc547b2daea831fb80c5100 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/scheduler.pt b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..4800a9e5803399b265ffcab0af9c3fe980dbd948 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0e61c4f166edd4bd232bd6fbefe6d67a5b7e00cb803d1741eac9a6d2b7b6ee +size 1465 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/training_args.bin b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..92ac30421683b0459d8eeecb3918cb3673f85818 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-512/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b3c5daaaf9864e2e038330c84861763b6ffc86d92b23f4c6e5428fc51e6cca +size 8849 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/rng_state_0.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..184396dae05e92756ebd1e2f7469ff03e0ccb454 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cf0afccc02a451d0d7ca163a03eb87753febffd8e19ade13050a9951e7f9fd0 +size 15365 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/rng_state_2.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a67b87220e05715eac718753d792db1db94d0b43 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc949e11634a45273ff1fe832efae68dddee34ecee487ee1cc922da94f4b933 +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/rng_state_3.pth b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..71c24f764f929f47eedcaf2be0a3ce06c94a53c6 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0f0622fbe544ddd3490d024372ffdaed053c8ed3c0f3836ce998ab8d5796f2a +size 15429 diff --git a/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/scheduler.pt b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..454813a4990df191f6951cdef743cc653ff31f83 --- /dev/null +++ b/dapo_pissa_qwen2_5_1_5b_20251126_192154/checkpoint-576/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105f4404298e62d6811a76a80078eaf19c435d835ba8926a324f78dfdc9fb5f1 +size 1465 diff --git a/dr_grpo_lora_20251129_132413/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dr_grpo_lora_20251129_132413/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8e96fa67162a079d6da58746c4e85be95f49eaa --- /dev/null +++ b/dr_grpo_lora_20251129_132413/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a053415ee3bb869d7dbb62245eb74ac26a0badd7aecbdb5bcf91755caf8eca9 +size 55408773 diff --git a/dr_grpo_lora_20251129_132413/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dr_grpo_lora_20251129_132413/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba598e309a6c41df0ab846382dfdc725372e9ed9 --- /dev/null +++ b/dr_grpo_lora_20251129_132413/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3c3a1e4bfe3e75c5d2ad3832be73b5cbbdabb15cea5023620af08b28a99b52d +size 55408837 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-320/global_step320/mp_rank_00_model_states.pt b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-320/global_step320/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55d6d3e69be1100e8103d40c98b11f5453d962e4 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-320/global_step320/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58f9e8a40fe0ae4ffff62008069d0fa303113e3256e26f54e2397dea1abee877 +size 3554268069 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-384/tokenizer.json b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-384/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-384/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-512/global_step512/mp_rank_00_model_states.pt b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-512/global_step512/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c04c75e035655f22294098d4415b534263f1abdc --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-512/global_step512/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d68c13129aca88811cfb4b684ee9a39324db5c2a651a74fec3fc8da1de33e3 +size 3554268069 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-512/tokenizer.json b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-512/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-512/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-576/tokenizer.json b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-576/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-576/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-64/tokenizer.json b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-64/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-64/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-640/rng_state_1.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-640/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..766524f5f715e666e319508d3d9c050df62984d5 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-640/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a76dd5182fe8c3437b85aae769e8a257e4f4e42a70f83d05c7fe127be5b9382d +size 15429 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-640/tokenizer.json b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-640/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-640/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/rng_state_0.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..cec4203802618aecb62118011a2ec8c1702cde34 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92fb5848f45ebaa4b013a5fed3d33bec6863b0a96d9eb1713147e5dbf606d495 +size 15365 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/rng_state_1.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..345f4a5f2f847a73da50c6312906c34f0ef50549 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce5d0787918bed9be65292ed1573aacf9175465c034ff2de629a30c3c3064a42 +size 15429 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/rng_state_3.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c07015f42b6a73ba0f166cb8203e7d4a52abdcb --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a66a4bdcc0cfbfc69d0ea6909a96898aa46d5dc74622534af1b410755528b9ff +size 15429 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/scheduler.pt b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..803368fe8d0b3cb6e6799bdf4abca3b9da20afb6 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e08e08214a2d61baf7ba9977b1a3e7a56b0fbbf6718956f14b5f44f3e1d74381 +size 1465 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/training_args.bin b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..aecb99b3f26384aee356780c931fbfecb9e94e92 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-704/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe5b31134a094422fde08c9d7fd4c7b9deb533ab123345f5a4814519decf5bb +size 8849 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/global_step768/mp_rank_00_model_states.pt b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/global_step768/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a2a5298ada13bac8ebe423eee15af46643759d1 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/global_step768/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d069b686209b237024b4ad959e65978a6d86a7b44dfcaf7122206df366b2f9 +size 3554268069 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_0.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..9c917a5cbf6be9298e613d5aa7e4e96737b5405a --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b5364417e965a53ed5a4749fcba08ef31cc2fd9eaefd3693ca1a4afb965da8c +size 15365 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_1.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..428afc1dcd68576599011a622f3bc5184507966b --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:612aace3ecdc2175c61101a98a7f7058e3885e89fe2c797af9016c944866921f +size 15429 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_2.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..bac1171757e79c6adb143ddbf86b4d0650edf114 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9da357f3632f751784f807f4de12b43bbfdcbcf242eb10b2e33b816ca0942ef0 +size 15429 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_3.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..8b72afb9968f39c8b6890109b80e74a3c434142c --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9547fd44b513fae196ad405556c896b8895f7fd36c7c448aff2961f66e6ba99 +size 15429 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/scheduler.pt b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..64fc77f63aa2aa8a8d0eaaa40da6b545740c0c91 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7d8785e96d2c77a396cb449178272c02f43aa0a9344d0f8b652208f432830c6 +size 1465 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/training_args.bin b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..aecb99b3f26384aee356780c931fbfecb9e94e92 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-768/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe5b31134a094422fde08c9d7fd4c7b9deb533ab123345f5a4814519decf5bb +size 8849 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/global_step832/mp_rank_00_model_states.pt b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/global_step832/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f74a6ecd6c4d4f879bd43efba9ee884b5917192 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/global_step832/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae32aea2f9506c75ccf5dcb2420ed7de5f0badc1ffca33b05237d98d302a526 +size 3554268069 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/rng_state_0.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7cb852c5e94fc6cea75715b31a40ab2f6163250 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5c7236855142637e565e69067e4ce37cdef60e649c9238e8d21eff343186bef +size 15365 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/rng_state_1.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..0e64a1a193be2f8dd0bd232b3cec1ebc1dc7febb --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c810ab78eeaccc6dcf8138a45261edae7b953207b69da30709df9bc33ec36ad8 +size 15429 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/rng_state_3.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..499d8f62773b093692bea06752d04a991daaac44 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d567520565506fbeaab21cd19a35baf4f6a95606247a4e89fecdd5d9262a9afe +size 15429 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/scheduler.pt b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4ce1daf6d63b6a1d8ea1ae7d6c3266903eb013 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0027525fc20783fb2f0316795b2fa9e123690ae366ad077f4dc95ac19e8eae5 +size 1465 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/rng_state_0.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..78a00a4b168d4cefa3aa398b6b2fc589d9862d3b --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9df096960f2be83a623ebd71aa4ae82abea294b6225f89b1c7ce0c35243318a3 +size 15365 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/rng_state_3.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..28d4de5ec1d156d71c7812c37810cd603c003759 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d284170d11762a33e2b51352f514656cc23dbeea9e41e63bde3a829932c2ee +size 15429