diff --git a/.gitattributes b/.gitattributes index 7a4a5d479ee55f6ff96202c11b62f95564dc42bf..8c88070d66a30ef5071f8725ea7af848a3df2395 100644 --- a/.gitattributes +++ b/.gitattributes @@ -76,3 +76,71 @@ dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/tokenizer.json filter=lfs d dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo_full_qwen2_5_3b_20251121_111716/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_lr5_20251129_222821/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text +dapo_miss_openmath_20251129_124147/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/adapter_model.safetensors b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5366dee97746a385fc5c8f87253dee7f0b31cbb0 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ebbc5e855944009d1140db0720ddd5916113dd3e9fd5a1fd249dd513e84690 +size 75228904 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd26da9f7bf4c8daeb7d8a4795f103ca14bdb806 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0efc20e1b84161371a394fd09f5497707cac93ee7ef9264bd043f190ee3718fa +size 112744453 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66a4a52e44ee243df92c6a6acba5317c8d310fda --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a176b2fb7fdb92a42e78601018de78f4ef01901147c1971ca690a8e3a68e59d2 +size 112744517 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7765a93b8f4a296fddbe8a369343bd320a5e781a --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b60fcbf8df2c1283ef750fbd8f3ad2ccba6ddc7ef7e694f554147d6354fa105 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16735e3cce42bbac0752e4b25dacc64b398fd8ed --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a799d79f923f9620e1b5db896d3a63786c2d253c128f8bfa345b6242f769f787 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93dad8824c6442f95edf3225f5208edf8ba97b8d --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca4e41cd3d43a3404c13226231ae13a8fbed17462ba29367c0f9a3985f67d58 +size 112744453 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31b7e6cd0759c8e7d68885291d4655676f6d583b --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de488a16cc358f58e3a483833bfec9b54dbe86c2fa99c7f87b3d71ba358fadfc +size 112744517 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2abdf1594d49348b417005f3e612dddb1f60dee6 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04e00548439d26f0493e677f3f2a56ec81b0086de0d9d1932754d3ac989e275 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee98c5e548c5356a9d0251dc18419a8ecb8af4fd --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5c7d0c13f976105cf458843e8da50f96fec1506c1a2c111059d22c676df6d9 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..475bd643e6eed24d900482ca32f37134a59a237e --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:588d0528dcf1721b9c635867e2d1cfe931f627c3a4df8e966d7ccb82d6d116d7 +size 112744453 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7a4d4c60077c49e015fbe1ddc62d23a54312b2c --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e221647db107bb019cc65fa73d2c760445da0950a4dc8457884ce74dfb4ab13 +size 112744517 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..720ddc2155ae39b678fddc9ca0d2908b61d7c286 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0f812a77da6b251eaa706b7de9831badfd7ba47e3aca4b624b31741c704c884 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d61844d8f0d13dbfd2359089055a68bed029c7 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48048f334fbfb4a83545d251ac1a30fd2f57d4106c8315609df73fcacfdddb9d +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7232545fc721f8e8cd28773dbfc46bcdfd42cecb --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1d7b21880dc152df3ae82f20f46c194b2cd46f3bc7b9ab0737e2abb1f966df9 +size 112744453 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4346ec824c4241a2f0ec6ff2997be4803a29bab9 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854c1306d3e4d70e73d6c62f0a4d258ae278b230321989ec3b10a460da459751 +size 112744517 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fbfb7effe363a4538634d51e819e87e18ea8ce3 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077d8a64ec54768845e66be77995226ff4ad1e06820c54bad279ccd0dbcb4d87 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4647e10f752c5d5b060f9e498fe550c680f490dc --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:178a27ca64066d60a723883444e9155bc961a2c0456f987d4488d1aeef34f88c +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..523e5b868374fd5f9dad6e37e1a6af1d6609e818 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b687595595b09f127a33f921ec2a00d8eb8267e6668c2be94b23f2f52a1d098 +size 112744453 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1a15addb1e582ed815eeadd4ae3c93fb24463b4 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e1e453eebb9abd2f486dea54e0c01631e1c94b56ef77907c7125a91cc446b23 +size 112744517 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..740f97feb04ca651ffd32fecc0738096cd44d202 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b10e4acae0c6c688d2c4ff1fcdfc9b2eabe37fd9f7c82b81e09184c23dc13b3b +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1e5e74e81848e62070bf0e6e0130521f5740b0c --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48dcd7d1297bfb30567f306c3ef823e78b84dfe82b5cce8e7a02ce6cdf578af3 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd7cbb4ba523792a948b7e3b596da2a73fd0453a --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96880b8a07727dff0f6ed5b8e2664a6f186e9cc69dc69eeb555a435d538e928c +size 112744453 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df040e5a62402fae9551af1e56ac5bbc594b62c9 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdd10d229e0d02747581cda1f64dbcfa79efd7b30fbe89ad0dede590661fd3da +size 112744517 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f34eaafd93ae3c0c8fb9174df4ff11d62cc91f93 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:540acb5826296ee78356dc105d7361b077766ab87ee2a52c421dad80aa9d9d93 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8f79efc7e37fedfe5d940fcb9a5c705e827c150 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6712a25d20c11d9baa8f92bc31c7e20d4fb7fcc5818a5277e52a8141b3e49904 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7925bcf6c5a940729f24179e3c8f2bfaf671e943 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4db17ee1efffefe0bc5083301f0128fa597a7c02d94c8fb87ae44c4f75b01064 +size 112744453 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a270bc260f2121336dd69a9dfaa3c34644f4b29 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c88af48b8f6dc22c6212f80afda930e4e1505941e035f3fd2fa236e1532792e +size 112744517 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a298b7cc15b6a5c78e8adfa11cf906602883d2c --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b192a5934e69615b34f13541bb995523d2d0f1bb187fef2667249c605c6997ad +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9a957cce7376c39436babb4c6fdeb61948ec178 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8a35f91694a63690e74e7670d1929582fa312c706bfa55f81190982e0e4d496 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8ff68de71868a8d66d6c4ee2a59d0f694deb729 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02826c3bf16db1ca4e82b9ed35bc089bc0a12b8e66b041077ad39e6e4b8ed69b +size 112744453 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c897fcc6907d7f648bc9839ba50621021658bc97 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14c7d4ba1ea576af91abd42919632dbc8ac9e7585ddd3c8b3db50bbdf9d047d4 +size 112744517 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fe14b1d6465e6c8e7e4ee017a5a0f29fbfdabf9 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1ecf66f588a293a787b363bdcaa30fb1e7e52f693c73d3ce10ad60b544680b2 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..939a28503fc3e15cdcb2fa21551e3b896da5bcd2 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30e2d29b44514e5fcc1a3a1cb23751a1319a3772be9acdf4e9497f2407227bd7 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/mp_rank_00_model_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e272623cef56ae4ce22cf4466de2e2df759bb32f --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cef8d64700b4f15372a94c8c621244a6449ff01ab8a276180d4c4b1cd03e44ca +size 75529433 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..130f7f3c37ededf4c833f75221a8dd37e4b66ff8 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc580e3b5995c9b0c434fe334ba8615ea24f8f71896c7ee8a0fd81b39832cab +size 112744453 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a110a9ad38632f201ab9136f5bc03e2921a4df3e --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6573b1b41d3c5aa24f219ad1291e820b5fcb8cd61607d5a79b4f721bd0d70a83 +size 112744517 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af7e194e6a9bf3c06ea8b675c2f227c213a17197 --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0747d1f6ac256801e0ba754e45f1fcb77ec3de857861515c4be75ab3da308f7 +size 112744581 diff --git a/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32cf99590eb74d44fa248166c740b97d5ce46f4d --- /dev/null +++ b/dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:523ab8b5c5f5608ab108d9a77a41db62ae043c856cff8ee6b698186da163b3b2 +size 112744581 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dd1e0ea51e66352dbe7835af7d53ae479ea2e04f --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60adeea85b30543a79cfc809c3e8f2b9eda7d88111eba2361e9d3920c70a421a +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59d8e0a5245cbada13565cd8d50a4bdb3210b875 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26292eaed3365503633b53ef3e926d07081c4bb8d07e8428d713c1171ba49807 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-128/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-128/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..407ce13c92eeeb800b9272aba5427f9845467a6b --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-128/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d411da0accc4c3694b34f72a497fe636a4d2f83845e9da226d8b0a2a18197ec +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-128/global_step128/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-128/global_step128/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f749e5d7cf3f3e6982a4ca8ad5e99683c9189139 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-128/global_step128/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68d501313a7e70d248b43a67c77c471fa662c4147c206ec975bb9f96b2419226 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-192/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-192/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..13daedcfca43fb502528f7f0895a5535cfad6319 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-192/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7e7720a192f805000e8a9f300b05ee6d88da5e073735da202b1ed2524c6db1d +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-256/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-256/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5cd3e74a06e452479d4be52ec9a710b6f28a58aa --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-256/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08cc7b0ce5f86bc89168dda412f63c9145c1239b16d5a06ada9fcfd5072bc504 +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-256/global_step256/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-256/global_step256/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54517e6df0402d24a83ba27697e2fc0a67933b3f --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-256/global_step256/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c6735c164d3ee473424f5629db78c870d1ca5667bde0cb87e64ec6c9d639a8 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-320/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-320/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..85d0eb7910073ede7d5f25a4ca62705e8a739b82 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-320/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48b0e10e9dff28a5f404a12ff71b200fa684e25b91ff3bbcad00ee998bed62ea +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-320/global_step320/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-320/global_step320/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..613b3990bca75212231a2540bd5e72ee169357f4 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-320/global_step320/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c02630efdc328b38ef0279055906e631adb659cb127f9d06d26b241233482c06 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-384/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-384/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..138d164af1c95052225e9b64892a53a1a14c30ab --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-384/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81dfeda7c2a446729f2dacfc914d51a7dd1ff5b77a8d2c562c4a433f7f91b28e +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-384/global_step384/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-384/global_step384/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85456a70412a7059b0242eb485655ba98bdfceff --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-384/global_step384/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe8827547ef3296b2db732ec828d05c541bb9d964480bcef3dc422a84dd78935 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-448/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-448/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..84b2d5048856200bcaab470b8e0147a3ecf026fe --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-448/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f78e043b85c81df6bab658ec9fa51dfd246ef5ad2b20bff5754ed7aa167dec27 +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29de61d2d2c6551c7bd49589d5670574256e69e6 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e8b5109775bced1b99ab61b37d99e90bcfa34e999a1235bf0c271fd5e0d3f1 +size 74329285 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-448/global_step448/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-448/global_step448/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36b5ca583f1e2f9e7ee426757d11ff06d9b5d935 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-448/global_step448/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17003a810b08be83cb8439ec5b061e81d66fb1c3959ce108cde15b29c020fa70 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-512/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-512/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09727cbcf91b72020af53b514dcc7ea2d06e3fa1 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-512/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a069f6213d30eb3f5f98fed416b0cf4c8e827fe43464d7e5e37f3cb39f69fad +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-512/global_step512/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-512/global_step512/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..928328286b9ccd92aca4766fa84e097d385a153b --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-512/global_step512/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17e181ee34f8476f375e73090f2fe6f37d0f9b53ffc15a1c86100a07a2e46b80 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-576/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-576/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f716371996eb5e7a864d3319d35c8282eda3e04 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-576/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485ec987b6a73db1f41206682ae8f6f7a88d510488a7571425ce96eb69d348d7 +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-576/global_step576/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-576/global_step576/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef65abf6730daeaa92085fa1eaebe25f56e0a0e --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-576/global_step576/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88376d45142e6f8b16600a72dd28de27399209354e3cf0b0b8b821d17e66bce3 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-64/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-64/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bfc01015f32665256a1d3de3fe56e3bcb827c4c4 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-64/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48f86caf4590066e51e97af166906d864c5054d089ceb3ca4d0f6743cdfb0064 +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-64/global_step64/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-64/global_step64/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..476a3ad410f0874d33ac05d99a755d97c51267b6 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-64/global_step64/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a6efcc8be03990a6704ccf1007a06c32710bfd0f229bb33c0b54d6acaec8ef0 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-640/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-640/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9f5beed58e074380293fd3cbf9c2bb8ca25532a --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-640/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a66bf6aaabf8f71d4a0bce66b548cbaa56cc7571abc2bebbcaaadbc44e6a728 +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-640/global_step640/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-640/global_step640/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e70dfc7228b73fb0183b6f3074e9f2522d2a4780 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-640/global_step640/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a6a9223cb937855bc52a09f0f9402cdcaf76165440487fe9bf417ecbca918fb +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-704/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-704/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ddb191010036b7b69fd3c260eeb35ee92aebd538 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-704/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464be65dd26c93e418ef942f12742385964f301b7fe4169a74f4eaa86487cc0a +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c456bfb5c187fac55d9e4d533fa84f46b081ffe --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43e72ca49e33fab4a65509479eff97c05e27fa2b85b0202801e9e897c462fcae +size 74329285 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-704/global_step704/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-704/global_step704/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ba3357ce0897423dd90e7a78a97774b3190c46 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-704/global_step704/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb8d5899012417880ca792153b2e6b6f2c63baf38f4cb247d896fe7067ad2f88 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b2ffba6c24f6c0eb944d2237db8de8a57b2f5292 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:313ad658f350b62796cbc9adde11cb97a9e013c8ad8893ced51a3a9fe7c395fc +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61abb8c02448bfc3c1743156432f5da0c6d454b1 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:026a7f61b22f4fcaf5c504611b295e3486f28ab4f04d6cda7a422b59b51e14b5 +size 74329221 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65d19e858f1b4c9d54c51d0887eeb35a80c973ab --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68ac23937e537d929ec47525f8232af8496883b067f86165b759cf5da5be9d5d +size 74329285 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4b6b4de327bd07874c97f8b7977dd5fcd786925 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c679f0da2c0436ac53df66b4677275151b6fba498326f07e0c4a09ad0c0750 +size 74329285 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65741da4f5f6910f70b7ca16b941c46bafc9f213 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-768/global_step768/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff8e9e4fee4e221d6fc76623697e1f5366e76e0fb1122267ea0e0e1fad2046e4 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-832/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-832/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ca855dc6c045150be05ae1f0eaa62a661f248416 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-832/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba7b879372d76cbc7bcc2f0d7a830c3c4d5fe3ecb43d746d37b6bb75315c6878 +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-832/global_step832/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-832/global_step832/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20f4b8ddea49ccdc98bf996961febe21fa65188c --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-832/global_step832/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2af75626302e990b11abea575f5c7dddf303acd915108cb2725c859096e188e8 +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-896/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-896/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d86ccc14febe41ccef6f57e83f155f5cd75e4eb0 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-896/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23803230d1c05b622aec2c1b9800d0cfc501432b2450c68be8abcb8c52ea7b32 +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09a014512d1b7ef80412b86d68aa67147a1438b8 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e08069cc9125c72582bbd606743af0e937e2e80816876964f92fca4419a5b26 +size 74329285 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-896/global_step896/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-896/global_step896/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ea859f015aa939db237f7659ca680b90de26580 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-896/global_step896/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56f418496fadf919bc1e4449b560096c76a216f62ac8c683cd88ed673bc434c +size 49768921 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/adapter_model.safetensors b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8afcdfaade3fc4efc66908f67a55e6a33067c69e --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bcd2252899e3f5ca6c8601301b3b3394448292c03e0a4c0ec7e52c9cd3c5063 +size 49582616 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b919b4e1b63e5af280fe7ba990b32e640f4f5a0 --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a5671f698dd02a971fc1294180cf395833ae7aa183173dada2154302079d6a +size 74329221 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad1fa0995b4d1f8f32a4d3d1bba63d037b64a6ff --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62e78cbf5e1f23f4905f2ca2188ddc30b04f91c541309d88753517e7eaf6d54f +size 74329285 diff --git a/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/global_step960/mp_rank_00_model_states.pt b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/global_step960/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b481341193cfd8767a1899399916a6d2c268f1d --- /dev/null +++ b/dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-960/global_step960/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f09bcafafdd4c03a476355b030a540dac2b1f3f365946bdcafced16522affe5 +size 49768921 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-192/tokenizer.json b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-192/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-192/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-384/tokenizer.json b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-384/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-384/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-448/tokenizer.json b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-448/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-448/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/adapter_model.safetensors b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c6c97042cc6e4d38989149446d1b71a4873b5af7 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9521be9cfe491db04ad9d1181fa540edcc6d7e5d0e8e5da42c050de8e641d3fc +size 90096 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d86b4bac9def3e44005b3bbf4922618ce33928c2 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:894642575971aed64748557e6882ec6fdb8fe64ccf43b2852f5ec37588310e9b +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7d52f7012c4526fe7eb9f335dc820ac70736e71 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53406048a9a8d3f11214778b5e2a574f7700fee6e722c7b6783f7ecc44a74a32 +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d80efb7b0c08eeb1f49503823a3d5c330dc9cab --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5171560eff7f5c8289573d2ade716afd6e33ebe01065ec46b6cfd73fb22623ac +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/mp_rank_00_model_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e08d74a30e9e0ce2d39a103040e2c7c027836cf1 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/global_step512/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0911ea78ffc66bf4f47110f090ad66b9294aa4a46e25bdea6f8da102333cfa31 +size 128985 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/rng_state_0.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..b36a98d84d656a25f163e9ca022d69411cd93722 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f316014c4e138f5a8770e92802a4e621e88c8441f06ef2236c22f0133b98e4 +size 15365 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/rng_state_2.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..15bed55db07f29cfb4a4f3a76a702c0d03b04cf4 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea1ecc7068774be82e1a9d57170240bb567b7ee995f34416627dda86a1fea7b +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/scheduler.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..4800a9e5803399b265ffcab0af9c3fe980dbd948 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0e61c4f166edd4bd232bd6fbefe6d67a5b7e00cb803d1741eac9a6d2b7b6ee +size 1465 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/tokenizer.json b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/training_args.bin b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..8ac17e830a9f541837500b71e4774e6dc6edc076 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed168d6a9589ce234f8617f4a5c08efc010cf913d062feb34c93bf908724b319 +size 8913 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/adapter_model.safetensors b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6eeede4e44bc7a90df6bac08eddc8590ea5795ae --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cc480ffe006bdb13aa05b114c9b9b347777b73e5668444eb55a5b77dfd9a0a1 +size 90096 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3573f849cc218b5ba5aef1d848f45ad86f67a833 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c073048cbafd01bab11bc1e99506ee0784f53ce72edf4706fbfe8fadabf22823 +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77af9ff6a6c89bcd87e61f2bcf94c9190c42fb23 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bad986bdd94d8df4768c5eaeb71b23dd8103319b7ce0a632b27bd9d9425cd00 +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04f4dee992f2636e556246d435b3fad0e17a1401 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a33c090ec414ff363be1cd7678e23fc6e8d5001b94f751b821c2902048d58cf +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcf3e3ba623533e79806cd9274ac1e6bc4001530 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:539c633e2eb597167bcfe21d00c2892728c4bb09a4e4c819634d286f012c2c99 +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/mp_rank_00_model_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92311dfd3cdf053dfebdb87fe464483ee078cea7 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/global_step576/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df93e63c24b883aa95cda7d48720236ba8096e9bc5fcb738189f4fd71e10a924 +size 128985 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_0.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..29f4ca80bcb0a542764137722f1d073b735d150a --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e13ee24f6be171bb77a32274a7c9ccdad259b11adb811dd8ad1afc8a75a793a +size 15365 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_1.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..649b4202873112ecb37928f3eeedb4c4d8017072 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96b378635996efc25457329a20d7156f7be2145bd600cf335112c145966019ea +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_2.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..9787481df9f30b500805925e90e9fd889568bad6 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6db05e45b2878ff1ba217fe87422098fbb1a1558d63a156cbe8c432e14d9cf9e +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_3.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..c390921c94c7efd2ec9ffa676c1f1dd145c450c5 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0af498059568b6281f5d76013d11c22fd595831718d48051639464ce0c5f26f +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/scheduler.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..454813a4990df191f6951cdef743cc653ff31f83 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105f4404298e62d6811a76a80078eaf19c435d835ba8926a324f78dfdc9fb5f1 +size 1465 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/training_args.bin b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..8ac17e830a9f541837500b71e4774e6dc6edc076 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-576/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed168d6a9589ce234f8617f4a5c08efc010cf913d062feb34c93bf908724b319 +size 8913 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/adapter_model.safetensors b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a13bb873cf9764b35954636916fba4f7a0a5400 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:260f53455e007bb90ac8185e283b4cc9ff1795887076b9039201209655d3b386 +size 90096 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e5ec8a821bba49c0a1ad658ddb6fac348857eb9 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263bdc028a51840f0cd79da2390abc1da28a8999d5045d27af7e06e2047fd70b +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1dfada2c2352579ed4800042cf65978be8043f8 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:934dcfe3629da24b0cd9262f5c1fe30a52d183f6814c5373fdead75af86bbd96 +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a6cbff3c8f5338311fee7e49b7276869b69113e --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6568bc8464422ca5e6aa7cdf8096a5c184451924c16e128ed9e620458e707de +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/mp_rank_00_model_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54a0c84016b6937852843a8aca8e5fcf3c40dbeb --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/global_step64/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b57fdab947304ed2978b50982428be012ae41829ece7e52469b6fb199cd6a142 +size 128985 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/rng_state_1.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..65d5e575915d9c4d54c6eaa737532eba1864c3e9 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50f5d6a2cfdd2b29101c2f851dd94b5d1ae5896c5b8656d4539b81c3d12e4e59 +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/rng_state_2.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c1ce8a838619d3145efd7890d7cf983339235e46 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec4f7a7c8d333e6c850a003f8a3cc310aac2d3761c4d39a0c007fc6335ef03d9 +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/rng_state_3.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..d4fdd424e48a2dae1f5f7165645a68436384782b --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ebaa282c1bb65b32ffe51ad0742d6cd63555e4e6947b0bab6b047883a25a128 +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/scheduler.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f18e6fbca95d9546e2f67129f5c8f7ba7da9e16 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93cefd10607223128e502b13dda034a13939769cee1c2b5c47751dc1ef0425c6 +size 1465 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/training_args.bin b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..8ac17e830a9f541837500b71e4774e6dc6edc076 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-64/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed168d6a9589ce234f8617f4a5c08efc010cf913d062feb34c93bf908724b319 +size 8913 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/global_step640/mp_rank_00_model_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/global_step640/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fbc94e5aaa15dcde3eb14b653110ac098c38c6c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/global_step640/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486e9b4ceb3c36656d3b70bf6714ecc25453b5a683926e7a43c2a142f65ece02 +size 128985 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_0.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..fab261ecbb26f514884780056c9bf822d0a0857e --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2851c660de454422074fecbb18cc7eaea76561e5db0971a7b766fdb7825679de +size 15365 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_1.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..d93cbb2b084fb4289c7deae5aaf5fb37d4c11c0d --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19daf4d7b6993eccd0e46635c263c1a511e75edbb0eecfc39e3750053583a533 +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_2.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2fff698bf7d2856d22e3f8a3d22a8e494f225d0e --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d5483c6ddfc19185233701bad5a1b9b425ca9029b92279338a60bfa7ef885b9 +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_3.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..315dbf2a43c985079d328d3ab271a17ce3687949 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2832378e794e1d64a5d00dfe7d197e1374d2e3f74ff38ad99de1d4a89be65bc8 +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/tokenizer.json b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-704/rng_state_1.pth b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-704/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..76e20a155c76743eedc47208fb4eb504d0a42bb4 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-704/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f406bac444531deb7b18485e69760e4de192c7b090f24a2d640bd7904cb12c0 +size 15429 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-704/tokenizer.json b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-704/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-704/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-768/tokenizer.json b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-768/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-768/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7213be157a3d3da76a3bd6fdb99bf9edf2c7854 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:141f33ad887c6df4e55ef0d26856974465cb6a93ad361ac47993f0ce9d0689e6 +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-832/tokenizer.json b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-832/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-832/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc1d10ea74b8eb24698b218535a48267bb00a858 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f11f2ed5d59708edcb97c5b8976d3cf74a424c4da8390e056c9c7d5ba2a0da9e +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-896/tokenizer.json b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-896/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-896/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c76149389be5e5ef485a215b476cb005bb9ad954 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27a8a5a98f28af12349030b99f3ebfe9b4dbac606e022ee8343bcc2d43f45f73 +size 134021 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/global_step960/mp_rank_00_model_states.pt b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/global_step960/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20582ceb693f1673adf71b75c256a0e93183df30 --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/global_step960/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:209355c5d2cd14c6256e79194033d6d040ac395ef1866b52f29733a28ff8c560 +size 128985 diff --git a/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/tokenizer.json b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..accc7ea3fa5441e393b1b7e40652a0e2f25af184 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1e20188b1164f1fdab47932102775a74fbdadd8aac5cfcb2746eb50fb5cbd84 +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-1024/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-1024/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..accc7ea3fa5441e393b1b7e40652a0e2f25af184 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-1024/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1e20188b1164f1fdab47932102775a74fbdadd8aac5cfcb2746eb50fb5cbd84 +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31776184c8d35b51004f9980d4c6c79016137054 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21eaea57143f4c5536ff1912ff12f878cedfab4bd385b6fdc5e0c6793332626 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d4ce425eb5d76ac490a26575d94aa39cfd94349 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a61fd59ffc9ebbf15f590e71bece5c8f34411602afc0a1566c3ff5df6a9905c +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93633d2617f1f935fb86366802a6c1b1a40e5934 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eccc99fc747c19c0d5fd1b8339a6b552586d15d91f2d135d0332e98d341e34e +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f757c2a01a0a940dbe1c94ad48c198cf5f45910d --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e775fcc334a9a40c9712f8471f745d676b88cfe0ae874ce61c7a527b47e8be6c +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2954c6936eed235b9eec7f41a114488d61f9f671 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:547fa851dacc6fb1d1605d6acc19d0816ad2ee3349db7b0d7a89a4f0aec74e2d +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-1024/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-1024/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..ddfe26ddd7763f10275adb288473be28fda65e7f --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-1024/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43118ba845b884b1d4434036bb862ab762eefcfc8d478d10e6c7e0dae84f44a +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-1024/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-1024/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-1024/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-1024/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-1024/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-1024/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-128/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd57a408b5c3a4fdf77ad185e837521d9cdd4311 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1328f0e1db129aa51a88a6e88c3ba2f64f8db96e26e8432d33c5b5496d95229 +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c0c28c14b9a8cb4e1c858f7c307247399ad42d0 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbbf3ce0c1ebac810027bb357069966ed98aa2b1e72b228c41fc52290b8103af +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5008d124143d21e063f4f784adf63d996f00a5c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fa991dbb89591106b918956e74b8ef233aed7f1e6e53a4dc860fb7aa3f6facc +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e860afc1f5ac722e72ed73f418f759df73e6339 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543fc307fabcc2c772b1a2874e3d0495dc3b7f557e87d967046ec78585e24348 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2814a855ee0660c454a9f23e45176ce1cf0c3046 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a54ae91acf31128ada3cbf0e1958ef7a90f167ff8aa2d76a2869fc5478116e37 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a41ec11b196949bb99a8d290de290b91a87ed96 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/global_step128/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4819229784eec68ffe16fe3dadc1250b048ea906cbccee57d57c21525bac329 +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-128/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ae1d9215ba65a5f0bc391c06d6a60cca9d0528a4 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21d8b5ea6790190b2fd966a9d37365585802bf2925fd443ec440a057b02c45a8 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-128/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..76097c8b4a0e8a24ffd8a5ccf2f3062ce4516304 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0bff77fdb5746dde9b62ba1273b9d2048d40bb3acc5d39762b04d00411e999a +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-128/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..8d431f575596c6f6bc05aca86cd593d6d956d7a3 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:583364ec47aa83f4fc7acf10756189c6680c4ae68faf2681b7ce5ed1ea886af2 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-128/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-128/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-128/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-128/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-192/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..146b5273669c9556395a0e0811bb9914bf29b6a3 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52a9905cd9e3331c44f436c8161a7b035a01fa5919817ffd2647100699461b66 +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81cf61fe2c2e4dcb33d841d6c64b00edace6bdf5 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22f1b93272aa66b471c4cee5d0e7e6c77a338a87ef0cec9983a087e9d6ae591e +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dba06df456a5ec77dc32a5ed1e9f6f23fa0a135c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2edd86f7e037e3a03831e48d08640c32e408a9140d672ab822b6812ecaf65d9d +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06491fd052f7253fae617d0765d8697707401314 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a7336092b5a2ddf404281336c06da2d7171953888a659c50a8cc50279aaab3 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eebf635e4baf7d501a7e0b1d410cefaf8afd42c3 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e5ac91c5d9290d5178fa3598c44acaa3ae226b557497e1f692a47357c9be694 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdc39ad6cd6bdf5df39139baf482e580f6d4cf48 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/global_step192/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0ebf21b582cfb6d6c55c3b9bb5565d189649a1b2f79e7e1f05bf4385aa87bbc +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..287a6517eb7f927535fd2ad2ff6a60ec68461d1d --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81ce4494fd11f6d79ac4f4c27fbb1eef7d62e9a26b2fc54dd673dc9ef8d18b11 +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..191cc3d36c8cad83d39c14108916302f507080b2 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20982d4c69e2605b20be9fd104db5fecaf06259147ea5bf49a63dc2aa839246e +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..fbd68943079fa3488f5e966a40329176d4b3ae5d --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86fa348604a8b5bc83c2f1aac79977f7202fc3d1ca70cabb6e92f2b3592ea41f +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..92db4fc5d2a80a4c50741101cc6b6ba52838c31d --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39040c61e063a3822414d472ec246e81e692c27a044302a59e816ad5a601b5a0 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-192/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee2ed012d28dc411958e61cf091e339df32c8799 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e72e25592f7d1a80ab924c960db7d294e745b6f4571ab693823a912de4596343 +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-192/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-192/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-192/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-192/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-256/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..49a9c6db281578fedc06b5756ae6d87af9b08944 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d9b6798ece4b40b2543e4cea63de96e023d0161418c82291046f00c87ec52a2 +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b025e50c9dc6997d70be5134855d1ed89abf83c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2482bc8852f53c07bed199e09b6e41af43f60588da14c3e0a6271398191929f8 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b78d71098ec5087de5f8960ad934d1f357296d1 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a12877674b09ac3bd317e4c81136ba603be9e263fccf28eb4c666807115b1a28 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..458317894b05a061a1ce1c9f04a5b200fa8f4826 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e8ffe5185dd2ae02b3ebdb62679167372587dbed737c715fa646082906e019 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dec0da15041617734bd0d0c627771258c192acb2 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e93a958cefb119892cf99234713d67eeed14243cde4da24102cce13feeda6312 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..0ce298cc5a562d19902634156a219f1a79eb999a --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c3b5ec4c0068ff222a5136e601982897aff66c8b52c47f2c2a94491fd23f132 +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..8cb2bb856079e51b0033f01b45476adfd3d4c3ec --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f812001cf72095cafe8f7c083f9fc26c2f4985ce5e7a7dea7a9859e7ab2037 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..3de9fdea8c36524953546cb5bbde357fda616bcd --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:475a12f119bd658b72bfb917f31c9fa74114ec00aba20c6f12e9bca65d5ee2e9 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..1654b5aab1711b9b91591d648849d88aa08aa392 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce7a24d755df01091f3d25ed0a452cdc19ce066f80fbb5f6eb14fd48c8a7dc0 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-256/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d79361b9ec23126977a661811ec74f55cc4f79ad --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bab13b9c13486692a4d9095c0b2bac949df91be0aed9a3974630e119d40c852 +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-256/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-256/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-256/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-256/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-320/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e81889808815a2d0077e1992726a9f91232e3fac --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57505c3ecab24e351e9f1fdcf965e36b8cbd87fcb18cd6efce672deced3b1b3a +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eaf85adc3b77935f29c324ef4d74cf19507bc16 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abd34547d0eb3375e3bb588999c6b86f3c18e44fd6f8c7dee79456cdf11c3e03 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c9315b1c1c4dd47cdfc92b4f18da29725aa0a56 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ddedce2326b8fdbe18bd5811270b60a8e320eaffbb41a50c28e0b99cb8e073 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db184f87710c5c946bbf7597ba41dd04dbaa72d6 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90075c5b1b4329cad41039fb0e7c184023e15aae61ee75261695422b9e534d0a +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cea08036a3358cc647cd2e3e90f978b80286fbe --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5eca4600080d01a21af95b49f54ff00ec10e217ba75b186e5110b734fdd3345 +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..68f72aa7a9975cfcfc4bd3c59e25b91f07408014 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:773da3b693cdc998a8a4b55c13f3ce76bf4cea7d015352746fe9f729c4c1f71b +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..973aafc7db513813c83d4bd34b6895fe028594ba --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2233b25afb818cd5d94639f8340509007a067017eed5e11c9712cfed9041c29c +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..b6872fc9a242f9ecd1198ec263a71acb7c9821a0 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:331e2c819decb59a9dc79fe697581cb360f3d06d3879aff916e47cfae5b5febd +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..4190721021b466442009e591f70ff34cb53d7e32 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9899c2af221d37936ee01c01ca2e403d8c962c34b102de03897716b7ce30fed9 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-320/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..25d78429549a8273f8b70b55f94bfff35d15ec9d --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ccc10e2931755bee96f95e5427c7b1da4cb590b7570e9ec1749d869d514d58f +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-320/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-320/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-320/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-320/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-384/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c0b1aea55d128d047885020d0ff38f7a744ad5b --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0902fa8966e294b9e4ae5dcae1633180d5b36251676a0baff0c3f4cd2e8f4b37 +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bc013af08ffbfeeb168fe6f9db940d06dbaf283 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47a225cc0f52403bc84ae2931230822a24df4769207052579ef8995dff4a97d8 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65548209ecfa05486dd4164175a861b9530a1ba1 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b08c99046fbb42c876726170c91c11babb7cb9d5a908b106d4ca4fe8e043d7a +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e690f1064d48be88f5eb9c047f1bdcae39b3b7b5 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49bd14290d85322f7d411c141319929c0c855f99013398079700dd24f33245fe +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b70fe0ca9653954e4928280720823c8f19c46da --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:564e429f46c05cc6675751f3d961cb2aaed03d3210d4f6c201131312204e1eed +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91f2f00c5f9f625c0d2b1986e8e30ba4581a4111 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/global_step384/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:266d1f505f215966874bf934e26d6ae4bad15f1b0d4db7b05f9af4f79eff2a25 +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..46b96a211e5503e0c1fb66b8bfd48d0fd967f3ff --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71690324d59e3863af46f37a2adff414c63bc7ce6f29cf44bd2604ff63f0d65b +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a0705cffa6abe4494fff7efc199a2cb4c7ce02b --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92a8b1af3bd0bfd96fc014c50f8f162778a01f402dd9dc50dfdb53253b07a51a +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2f30b595134318115c4a9f3512e8f664b0bf7421 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b7a08b033e63616b83d078704eb3d8a058d75df29711016194fa41f7973f156 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..128f56899ed876b33d220a42e8b1110ca38499f2 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b7f0132605651191b3932d24f9bfb1d8c65956cee64523c3f571f59fa09b68e +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-384/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f059ada03dec0fd6b0c52f512e29ef0acc49fc --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872697f665d017696a414cd8d3baee9fa3ca3d7c0f1efd82989df03c6f052411 +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-384/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-384/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-384/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-384/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-448/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d0b7ec6672b4093da5ccbc4dde846674fb03cd4f --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5e3ca544665b6916fa37026cc076755fba7eeb9e507509b6c13a175df9b58e9 +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b19399a3619ffad874026702ff3ddf27c166cd0 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ce3eef2f8607515248902a07e4d2d2819ad6459eec03cb30dfadc6cfad902d7 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aba52e7fc24a19fd24184b9a46d5f8d1bbb17e4d --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73701be4e4888223cc6285d4dd97b344c82744d1e3849d30ad6043954f636880 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c4dc2ec329053977e7b13df6c5d72ebc277b62f --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3f71ef609811ae75e197d467083ed951b2fd47cd18e0fbc2f296bfede8e0f2 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cebefe2d9ba55a58025d3c5972e31b8f1f6d3e56 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:214fd4040b5121dcbc891668195177cd4dfb424814f52b6573b57615a900dc12 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbac97bdaac9591425cb8e78cf9ad5a2c6f159a5 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/global_step448/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba74ca6dd454409fc4ade976b98bbe6f2a4d22dfdd84ee1c360c5dd027dc94f9 +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e9612e77e96be134d6089219689f8a1ce77e3e96 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9650dc1f7525313ae92081f236a496de6a4f176acd19c7112c90eb95219601a0 +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..08c6224a18ae4fd70ed06fc25de908bbf2b82d28 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5d60af193b4bd3cf61688b27bd12a9c75347576b4d4cc53f6f58f1824ca8a67 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a079f7027d94368f89ca4dc51ac74e59f815a35b --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cc58f5d86c9d911509594f69212c4654f578f15771812f015cb0f6623ce274a +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..0f1527d75b4ebc656f719af0af727f56f8a882aa --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49e57e55215e45c6eb725c3c3091cde496e50b6a64c7c7a9e036778bb9442a8 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-448/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a770dc2e646f1b88c0f265cf79c79035aafc45e1 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fbc511b021530886f21a273892f93d99bfb91c5cf259d5b4e6f13c8d53879b3 +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-448/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-448/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-448/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-448/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-512/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b255493dc7f5cb4819e9ae36571bad775f8133d2 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3053f6153d26d940696e7e8efae98463be63ef679dcfac5b177d1c7d016e7ac +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f0e25b410d999d8d0715805dbd7ed2236f20184 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e1c058f06c0ed56d910825270b7b7d41b3fb8086168522d917a1db000a79fe1 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f3032dc4a5df7c266bbd0ee59859313c1a203e4 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de6f620ba474e5eab2278966fcd3d956df2ab84a34482e31daf7beaecea03122 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01a34a10583172821183c45dc4f9e85ff64f400b --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75fef8c9f725899d8d08e157186e5ba42afb3b96b3dc732f2aa6712382de59f7 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bae89993405ccb1b0459c9f847346ef19a8ce540 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b87af92b074d4e6ed42e80382f0b82d826f83fe1064953c5544cb5c978c97e7 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a154b8f93b4eb203f16bc9e2d509437288bce2ef --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/global_step512/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4153ff871e8ecc3d4693d8623bef50ef8872889e15d538b94c5f026a45e1b6c +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..b254adca7b97ab1ac38582a5ce8ddcf97871b5e7 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4011db9e524c07ed38d02d5a21f405e242a1d6a7f97d9eed9806a72fa5aded +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..23d344ec7e3888b5e517f14d46e5cb6f631ee249 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd63113cd6b8652baab477dbee6d9bb6d049bbd96402eccb7f1e91ba306b643 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..6cf7282c5d0118b8502485b9ba4e221e41f911e8 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c388265f8b2bb9223c8ff3dbb6150f6a2f0f81029c93a02a74650734b13edc +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d9377332821cbfd3108329291c41b944ce7cdb5 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d94c00d9665d06746ec72204dd1db3583ceb2dd1d7c8f1d42cd2216e4457c9 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-512/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d65b5feaafdb3cc72c6ef0adb0b4c07de5bc8064 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1623515ab61bb9f5ac3efabd82b4ce31993463950d4e106cf55a565102542095 +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-512/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-512/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-512/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-512/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-576/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..daba91acfed09e6abd0ffd694f7c6da3b7c75d30 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d08f0263a6fb7388e548141b74c750aa5b5711f540d27d4320178472164b7a39 +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..829be1ceec9c04d94b56e74e3e2973f0493b9a1b --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63c26d272f603fd31b8db57d857c4aa9cbb2b7b383f43569a942db601b1341ba +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..504c17db7da9f420b956991153241ba758ae01cf --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2a5b1e91d99c08fb373649dd494300fe3fc56961126157320eb185ffddc3128 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..584415fe9def3ed364ab1b3e6764ff10ab4fd042 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad3c3ac7145aebb288124f43021be639e187673717ba1ac4d4c1139ecb0c05f +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51c7754938d99b8904701f8e4d44780052980d2d --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb2f380389c96e580734a178584cca817be8392d5c63f6a5aa5841b438e0f25 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2658e02a545ef13330a21254a7112075fc5ccaf1 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/global_step576/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e4275a039cae49426cf3d63f8a52e9ac3bb0745bcae4b917d1ccfc126d7b641 +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..32f05e01480e95ada8b7cd51df1859b0f6437e17 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:093b00b46c833fdbcb1e0433e8feae8fa51e281304566fa20cc400f7182d7cfe +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a14ff21f7e3e09072fe998bb96cdae2ce4758de --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7e1cea4eb8c68c33a4caf71c738a03fcdb486e1f0fbe4507c1a01696beeeecf +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0fcbaf29566811438b7966287b8efd00a6d07e67 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9abe5a83bc642919defed3290e3781744b72ceb81343450cb0d79f18b409ea2 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..0df507d4eea872570d1b3dfe2a2a4dc437e571a1 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a6400f6266b9248f65bc1de29eca66c2ad403c99e71d4aaaa93ea2cdbb61233 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-576/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aaaadf4abf233837dfafbed736613bbcaa7ab58 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4006a4399a7418c442d24747fd14d2dce24a682b5296c6c7e11ec68a7769e01 +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-576/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-576/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-576/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-576/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-64/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..75f0de435bbccb549678eede9df2779812480c2e --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4da85a9cd45ac041dde839b9a037887b52e103a9287f178ac57c41ccf97313cd +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd947a4832050dff36543ea9d3f3c85a52a09e0e --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:115d3aaf729e85ce37d0c31d94d80140125c978b4db611256d23005d792c27eb +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d852d26a716242a60e7737ec7b2a0e991d87618 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa04fe48b43c20a71dbfb380f90f8e04c3a843b58b31b6cf83275592df1a957 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75c2a5211bdae1d7834c5bbfc8504b11d6bab413 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c1a55ab0d38667ae33ca5436d19141a5bee4971548484a9fb4e1d380f36184e +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..a91cb4b889a01a26c494a3ae3c8d0f0d5ca91b98 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be1739c2717bc420e7fa2a7a8a74c3f4295c278b6b4765e1ebf1701a6997d4ca +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5fa76239050e34144895d2d138b654d88189f6e2 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04f8054ec45180a327a6722e6276fc1d855eb5b61a89dcfabdc6b7f68d160bbd +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..74b178d8eefa45c9b385d2bd64743ef4106b913f --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7da6b70e6c0ee5c456e4c987f202ae5d860955f0422f289d49fa0c3d47e76a6 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..89a82264ec594b14dffe33dd8049817a3dc80433 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d641f8b09fd96d3af3ab10d3f9b9b7cced9d70719fd4a49e92e46d82951cbf +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-64/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..61decf82d077ac931099f78358613eeedbb8e985 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cb6ce5761cdf285e895d668f986035bdeae8b6ae41fda12bb832664dc3eb080 +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-64/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-64/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-64/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-64/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eeddcd2bb19f50a345ef4e2adef51c5b135ee6b --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd8de766bc2bea9001e941513d88c7f67e1326f6fbc0ba88cbb1fe030618624f +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9964f77d23d9b26e8822523ea3a39c94b4c922b --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17d021055d605ea55724b732b189727cedb4da253fd8855440f6630f206a9303 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ec9d41b0b737c48b249cea65336148bb152d411 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35adc429112bd4c4f26cd52e339c241e56092d624dc9392001d630db469edf56 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77fd050e81efcbd39b39832e8b3de244769e27c8 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3970c4ab3479c3d1c50627fd12dcb13bff6d683e367fdd73fcd610b2624bc3d1 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34a7a788246667d995e504a45b552768632b0a3e --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/global_step640/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc5a834d0a1ad121da440f08fcb33dd2054c077f279a45312a785025fa59b1f7 +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e0c77cccd4e96b373b88f0d9290f79493e7dcf9 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2806df115ce5720b0ea69b3cb98fe71c430f67748cb2af4507dd1033e52acc51 +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..76241e111235dfb06f3c1dd066b71e0a312e19f6 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1562abf36a9bb196c016e8cc504dfd8088f3426001a4203635c48927e6d797 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c16337a9bcbf62253e3583fb9d8f19e837a4bed --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3912162cd19c1a8033ecb25579b1af1ffc50d622c62030d96460a7ca580dff8e +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..9e72a7ebfef150f6601c03676d8ee1f475682cff --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9def8c8a324194f677318a74870becc6b743d32c9b88d337ead1ed3c161306d6 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-640/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1f99fb81b2d16821d6004347383d3ec0c00fcb7 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:095a20924dc9207e75419ac4f3ee8eb9d90b86284b88bf35444f0c9968a37f88 +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-640/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-640/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-640/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-640/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-704/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3091ae5799d374492d41578c4c86ae461147665b --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:803fe845e0ae3772f811bfabe3263e7d03bcb157009c876d15615be902c27add +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd47127dfd14eec4d6a3963cfcc95e9823d2c6fa --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5f6cab22a5abb5400223a6836896f815854141b089051af871ba49c6ed42cf +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a51a6e07541c3377826571c16e490a9d07b3e8dc --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44f83af0816ccdd6e955c2972182c0a0c20c4ecf324967381bb4fa1130757b08 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..b18f7e27713acf50c86013f19680954c9089e2d4 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fbf960adaad04b7256ce45bc752cda965c03a678f4e3e75395c421b92855aa2 +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..4c5cf1352cbdf7d2a09ccec893c775c29bb69885 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32587f9864d9512da7c9e895260895e309ccbfa5d9ace21540f8c53fb0c66d41 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..4f5fda93aed25fef4add5314e36749f31411ee2f --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f33aa670e181785bce15ded10e48ce24a2065dc6976c3e4be4eccf96a20f3ae8 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..11655844e972c65c66e5d3e37c7247d9404291e5 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e24445d819ea67582f08f9f47b832996c4fbbedf75f6144ec2d70af2589451cd +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-704/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..59b6d1a3fa824eb802acfda1f213b36019c3aa79 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332919ffe79eef0ddf3bdfa22c9cc34e5cbc1998d906df46b1911c38134b913e +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-704/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-704/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-704/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-704/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-768/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94d9daa833c276d52b7f7307ce86126d24000fe1 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8bb3216f4de532f60f10ecb1f07d85dd1800040efcab4207d3af1f4752edf3 +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..081d214d5a246daabab563862e8347ca65c9ed06 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07dcecf7cbc4d573a513a30d836af8b8d475a66f9968db77c7f74653fee6af60 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b7d1631b2df1f28de29d82baa1f90876ca93b95 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a701e65e22486e3fa18fe77d137156ec12dd81ba5982093ebd9d07dce44a7e4 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fdf020a60c551deab07ee50116dff984e7c5330 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d1ec4bcc705bf1d49b25c61cd18a76cc3bdf01f2a0137ba25781bffb4769cc +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..eb2cf52f7c1372138359245cc4aa1b27f84d8347 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:616da0ef225af19875bdb16696232dba936a520710bd196e41d17a8e0946b219 +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..a700e24fa0c7dbe4bdad877e45a73f6918b23c6f --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af7c7d74426fe93c369bab1cb32f8a2c3c09e9008f59e857c328f910488893e +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c94829143d8ccd01d15d0cf198b4a8961169fe55 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31af9c946dc0f14da74f2a0f67f6bc671351a3605cac3c220c0d312d34e3dcff +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..1231f3824197ffeebf99c23bb8691e97d10a1da0 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:629ed0f622168b7111d79fcf2b1b76e1cf74e4c86b2f1523fc91389eaf659021 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-768/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9943fe179797fb45e7b7fb5a686591c61e54ffe0 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edcb10cd8d45cdfc9059ec0723f6237a60d9fdbfe4869573b2dd393ec70cc8d +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-768/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-768/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-768/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-768/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2d1e8f8ff44ab4575c3eea14e194be601a1f007 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99958cb489a750606feca858837129f5cb9f396368469fa041354fa6dda74ddb +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9e9c1a39af759f66866043a9cfcdc8ba09ccc8f --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbfff7b7b4bf7b57c61cb06438352977ba96bb8d5166136a7f508390328eb357 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ff7bb23b26df4309aa462e4ea482cd135d18e57 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caaa204fb119a1d070e8260b994d177b349320dc9fe31bb6da1500da7e2c9a4b +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5ab8e66c20bf53c851034e2848045bea61326eb --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949dc19bb552a85a08f098c9cede0b6964cb002f3e28fdb615fc0e9c38fe01f0 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..79e7f1ad6694e512d115e06b8cc8caa4d000deea --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0324efdadec3ca8926df264f8e57cd144e0b6730dd25ef80c35e6c8fd6ebd38b +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..1db4d46a55c69b5207f43601a556869563ad06d7 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e348008dd66488a53012af426946f9adcb201804b36cc000da3bbbda87f9145 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..900a449f7436a5f64b8eb74cce7f92007f25e470 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d84a2220aa1236fe38a111c0fec252b6ecd4f93d239f0c6f369e5db0117bfdd2 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..e6ab052b558cddf3af73f0eab592537f4986273b --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6692b036107736df5f7589eb86b0c6a18b7bc11ef64fdf0d3beda9ccb80b440 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-832/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..64c0dda39c077120e10d37bef913322bd622d1e6 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f645f6e3198b7fe7574a07e043338195af4a9cabf2ea64ffb9cdb8da953372e +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-832/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-832/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-832/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-832/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11112c144eea1423ab69574ea470e7f6bdc88f02 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3644952dafeb3bc613b8fe179abd789b70eb4bfab701570a49e2c7deef7b3288 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40bcf6db49f7aa53376d5a74c336d74696188f14 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e65243ed0cda4b43aa996275828ab29d950d332a968edcae9793b559dc2c6892 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4a7edd555d8fd88470272f54661178499d66dd2 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffde2f5d404e2bb1301e55e66b98369fa4a28d5ad3d61a866ee5fb4c14d24215 +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..910b68ebbc4ee7e4d71fa35458947fc407e82694 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c77ce12736e79145dcd0946850c65bb6673be999e483497075d844ec4e14de2 +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..1797f8fe9089c97566fd063e6f67f3b7ef976a91 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af7e266497fa8e260f09a3ab793c4e380a63f27830cd9ee53588c146bf20845d +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..b2e5fdc25724d5aaa92da9a605ebc7463d5b80ce --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18d9f6886542fa6e1a74d8ef7dbdc60ef501d9a294f641be30e05197b0dd7018 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c8d06b9886e505c58362dd99b47ac50f10ca4cf --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ba33da6e4038ba9f3eba00e25096f19d537887e79ad001a5eea776ae266e18a +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-896/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7db55dec5e28c0efcc46143639a6e87c19c8947 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39fbeb77612dbf891a51991e4ea9749c5bbb627749e44c2bedec243d0473c3ae +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-896/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-896/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-896/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-896/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/adapter_model.safetensors b/dapo_lora_lr5_20251129_222821/checkpoint-960/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ace594578120d47951be3554a1ae07547cdc04d --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4fd552873b21ef632f631b53375597beae174e6c8724dc0082a395da0e012f +size 73911504 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c737ef2daeff6e7b892c55708aeef536223e6eb3 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e786ffb3f932843c547ab9580d3098f79eee7a87a6b16844e0001b163bae2ca +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f11c01c64ad6dad86c03df19f2ca26953ba5d439 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73041270ae020d9aca72895ad76d5dd1636b132fe23c4fb904dc30f553ef20f8 +size 110803077 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d86b7cf34408d90024d7b8001c085a8634954334 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd072774d41137516bdc79c8fc9a8af1e210102f93252a804762d77036cced5 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dd62cfec452ccb9186f0f7b4831aef23aa78288 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99fa9ed11f09968abf7b2a7593921f52dded61b7c9d9fe4c9ce117379f787b19 +size 110803141 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/mp_rank_00_model_states.pt b/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aabdd95b35fa4780423b2d19d1e2c441129613b4 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/global_step960/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4125cec07c38a1fce6a4b98a1adb2985f3ad74fd243816eed91c5b17dee29f +size 74161305 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_0.pth b/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..67fd650148aa01587c48e6988641f05fdef411c3 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57ee912f4dc58a0ed5c9273c365ebf4fa9d2dc8931a0107b4ebdf3df3206de9 +size 15365 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_1.pth b/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5c34cb85c7ec8e9afa898279f4849e40cb3982a6 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2693809b0f00c7ff5ae5ad8902e696e7a8cb3b35bf340da11c044ef4c27b82bb +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_2.pth b/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c16d3fe2ce0c9ab4c0d261169f1849c42ca3dc5c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830662b6e8f7401a8df32a57682593391734ef452d8f80982a2953fe99b709d6 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_3.pth b/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..e18fb2062f100b5cf2bfd95ea15955e34d203f65 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b5fafd7497b23edb205852f7380275e8acc92461cd59409706af854c6192fc5 +size 15429 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/scheduler.pt b/dapo_lora_lr5_20251129_222821/checkpoint-960/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..256d30fa4697d069addf97c7ca9c1797cd8255fb --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7669a3a20bcd54450b2d5994eca9e1af1dfabe6a6a4726ec8d46fdecafad3a0 +size 1465 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/tokenizer.json b/dapo_lora_lr5_20251129_222821/checkpoint-960/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_lr5_20251129_222821/checkpoint-960/training_args.bin b/dapo_lora_lr5_20251129_222821/checkpoint-960/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e78e81b63006cdc50b56c1b4072bf15526a95a70 --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/checkpoint-960/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbb2821af3bd665530e3b952a48404896a15b24fe94e9581441c54cb95b8adb +size 8849 diff --git a/dapo_lora_lr5_20251129_222821/tokenizer.json b/dapo_lora_lr5_20251129_222821/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_lr5_20251129_222821/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..292ac25b477fa31f62c0b933b33cf190f89ac9f3 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:626cf5160857aece7f740979a86c60a2be5bbd35a8b6e85beae75be80bef1889 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef7d2e35f18aa22fa708f5453e144630158ca3fb --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0e076b10231d2acb650ce18d4050b36ac9073fd949b9cd9c9968af686f0502 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67ec49aa7c694be4969acac92e5d0cd8abc04a55 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b75b62dfa03b09c26b803194c40ada05b18d7a7fcee62ea5c9622cfc8e884359 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98906257d81346b21afc50445804e2f217321684 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:714d8f4c2c0a75111b4438968c9b1c1e071516ba8c763dee15fe678c319f13c7 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..102521383e922c0bf2e95a04770a8b3f0214aa7a --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cc334ea1cf51657d5f469851e26b8ac9d8fdf2c37850b139ef975e0daa4d574 +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..9d95cd658ec2b4b44230183edb1e72bb574471af --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22864b705799a5abb5ad4018200f45d3ce8a0b98f0e2d51f8bf23138f541f63b +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2eadb981b05f709545900fbb8c53a311d85d8b57 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c0651270fafecb40fcb3684d4d3cebe22e6bdde3c49eb5d09cde3fc379fc2a4 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..61bb2819fd875bb654294bd2f1f58ba6b57e0c6d --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4451ce36c266c4c3b2dbd1bf3002dfae213b56efd8ae7ebafe838b8d86abe0 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d91d84ee7ce6fc15f8af630d20f12aec7f58eb --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a000cffeb82f679c5eea33f850666a8c70d17499ffc7879cf41417a213f90c +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..160feb0272125fbfb23abe77670480539249daa2 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:274a1adbf90a56d8939d390c784e4ce43d43d3d127a616535defbca8e4b28719 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eab9173f016711abe799411314a46a52c6730da6 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:304e98a327159eca358b4e8711392e167fcde722fb24ede00bb00cd65b0364e2 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbc5eaa1c8513f0c6a356b219bae3dd8752f2cc --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a47bb9321030728cb2ed7296ceb181bfcb1bc2bd4a5bab7ebc1b106852a615 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..328a96cdad79aa0945373474b7d15750423c24c2 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fffaf5f71b232ac91cb7dac2bd820d0e19fc8b0520c6c92f88155fdfbd54e24a +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fef05a72b6bc67d2ded7c27d07f8cbb5436a1920 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/global_step128/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25592ee322c337fc08989869bcbde0b79c38472282cbcadac586cf2dfd049b82 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..79088b9f704b0fa271a21993c03387b7b1018e55 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aca345a24ca86fcfec59614dd6129a24a159c83580ef23088547c0616f885301 +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..4e4c7f203afe559c4499a76aa0d3fa807fc447a3 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64317a59cf56e6f2190b6585e67aa4f5214af0c726a03abe4f01edb6a71df723 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..7731d448a07815d7f1bcf06759e5f5e914a16b08 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffe5a39ac51c241ca7c052a694d7288d284ecd5ff822cd7bdb0c41b8d093fd13 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b580186f6c80cc3e5d0660b09cac1a1ccda07541 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fb84688ef01f05061911820d90dc33f9b7aa61f88d3a317954409a5c32d4a7d +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d08ae64295b57090bbaa5d6676253533d838873 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a72d1751ecd37a23ecd20bd8b9260f394c2f370cb5db8d203bad7d01395f4fb8 +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c0561f1c3096f0f8caaa9cedeb97e2212e7384 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:940668dce999fe2437cda2d411573275b4037924600c238ceb3e1c2b17a5f86e +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..684cc08cefc319aee9b20e8c20c59db4c259e477 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66a21c7b6077e66362b0739cda70d13bd8b88649a91bc7c380c40ed01e0aa175 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1837bf021b5ef57b149a61a89e4f43f9184bb98d --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d3a22d97f030a7bd39b1b50d71174d1c2c357756bc181e9ce6b2bb9f693b47 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..f070b2b9908814925b09530efb1072a6d1d72107 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5804aceaab9ad3b6eb8fbb505a82e3817896a217f804f8a8eeb12840aee4192c +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..3b805d61f9e4d697ca97eab73046f50725419460 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46b9b71253c6b59ae6caeadf17af774a1dd58c4a95f03ed5b029b5cd8868aab2 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..cd9d204fa51bba60b2c6dc8ffb4f49a84e58d4d9 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ef2ebea11e95e5ea2ce43c28fd76b17400a6c9be6062e329e8f6961a116943 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..e2f54d830841aefeb9e33cdfa73c7a945a600c2e --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8c0b5cd721151807008b134bf1446d7a2baf389d2ed6331a335c97d13c0f978 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb4e8900ca74d271df161df3e78c5e3163d3ca2c --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac63e93328a0491bc31c5b67747712626467b0c1fab68bd8f3a90d2ffc2d318 +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a2c8f68ed041b6806596d5192c05f724047ef06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6830cbf821460a0fd8bd366e567898d7916c714abfe41f1f48d2695df40ec6b3 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5317f16e4c5a2a3d00ff9f5cc17a79c5cd924bf --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1330e3d439b380fe3f8966bd63b16e1e978946f43d1019cf7a02ba987af6f177 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..621ac047bd0ababb6113c95e01c5fa6b67fd99c4 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c91df4bcbfa030f04ba5bc9c34fac79e37fa39f8b7c4b679b61207be9e39e3a4 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9e24a48a270124c942efe5ebcb2866622d8a7ef --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e088964814bc7eecf9b805d546dbc224f2d8a3ba39b49adb0642a48029a0a6df +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..95131a87e911f5471d13fe719e94d763077abb0e --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09da07dc5276b746caafdafcd4d566a579ff73add133134606a4e813888dfa38 +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..d5e03082fe3c848e9e39af12936eba19a8f978ee --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d508190fc73b73c802733995dc3f6b8b9c2958b76b0e0e80db84cea6b2feedaf +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..082e0037c40f154105351adfbf3982ad7d2002e1 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:529d8f82ec7eb7c4ce3988eb35154324fbdfdaa774b55cedb4a632f45be8e7fd +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..d451bd683fd3bfeddf38bef2b4a593c1d76fa488 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05cb48ce0bb054e598f885452d22e0c065b94456f995899fe59d632c5fcb54b8 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da175406e5951634027623c46687436be96a222 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8495f527d2ae384d255f961a1b604892e1f5459d17e99146a7b64167ecb9365 +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3141f8ad5c654f48ba67c4f235fd749df48e43e --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f77d40fe2aa3342b89d5102bfe87327dffd718d0c19811baadb00b8464c4c852 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94f42970daaac733645f660910d78a91c1b775b5 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbee3e4d55e6de7a4411e191f2fc0da1dac37f088242ef0d349947c027ebe86a +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b153c40fd12139debe0ffb8d2e2778cc9d8e456 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:160a756a0c492451554deaa6d3e5814d3284f8a5e7ff6808b7e8ce4872aa9f21 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72371027ccef8f5b298e2ab638bfae457f6194a5 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ee0d6334786981d1ad34d7d4d757bbe9d3c6668023821d593003a2a2f372d0 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34a09561ec6b794c7d7e7bc85c3a170d563ecff3 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d958f7619d9164ef727d951193f461270aae1c9e35c09e6052c248ea4b66c38 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f7796a000e5f96599d69f25031fad4304c64f2f --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9953fd5296e03e92f89d8ca06a6e98c5112d0ed06d2c150ac2fb839819a36890 +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ec0e55ac604c83528d1eeb898d175045e5f3a0be --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dce92b78533788ca9a868331e178e0137328968b9b3a7c071e29b1a87fd895f +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..7b8f168c7a97b0daa09ce7c2a9b22c900957d698 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c19e82680e308ecf9ede79a93e5bbb33c262155efbb702f1c6f521b1480abdd5 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..25db8fbb64774a45acb8dd13d392c2bd44e57fb6 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82ddac2b4707aed20ce9ccc9426c8dad042baf8320489e468e7e0ee5e0681706 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b635ce1666c50e816d388484f117d6c351b92d3 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da013ae0b2b98d7666c2dc2fe7c1c09f26c72a818d58bd9b5b49a1d1f432bd5a +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..045a9b8b90d04ea0babbc2a7d8cc87d8762394a8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e839bb6928a997cd808149cf11ca75586f91762ed91eb604deef5d015fcb94 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f744d51245b9a6a3c63544ef442890fc7e176165 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8481b8c0be55a09a25a5be7f436b2ad5f06dad28375b103e9360b5dfc216d92e +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..2f5f8a8b9ab2760d2081bf4e709a2d830bd2d6a8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:221fc8ecca384caf9f903698cbb0a1c52c56abfebd650a5906634d93c290f09b +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ade3583b4bff810909363ca75312a8641ed9c257 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083c1407f4e416f65edb31268fa472b84abd31a4b41f4e5630fc1182db088381 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..b0c0f835a5c26ad43442b7a7c8b1210fe9ee1c69 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bcde77b5135577b4165dbd74d7a1ec571156be38df8bd4336b134169ef344a4 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ff42349e14177f7944e7395181a2a95b30f2c98 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:980a65b2d547d78fd2a1645f54ca9e4fba4efab90355f9e08dba4ca7cbdb81fd +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35447364346dd4e48ff2912c9630fa0d550dd81 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a73b3132edc693a316dd18b0560b36c0fb0501d1030453a31a1309122a6bf7c +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..abf774643ad0466ab949b0ce93aee7054104dc7e --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35b69e1adb7b4310610fa7a65de8758001992535bf82df54c7ca84d466fce8e7 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de36e9e2d1e4f0d3e25975a6f24b492b80a0db26 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6f57380157ea05689f141f468f8d9bf7f1f855ba22cec828b80b6a94acce217 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..8c3e965e86d808d1591013feb5fd9e19aae66632 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b75611645459c3769097f598468b054a7d4a05b8913080c53ffbd44f76af6cd7 +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5869c9b034d1e9cccee580e40d40c230f839f1b2 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:239178dfde70e0701f35a6fce3d0f7a52edaeb2f188e73ea3e4cc2a990ce0ef6 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..515181b3df0ee8bb249aa8b87326da50784f1215 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84b69c8b4e08abc8cafd726d1a4349daed751d76ae5b67ec428aeeb66d1c897 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..da8636eab39734d4c46bb0e2284f50d4e7224f5e --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da92b99aadd7fb603ec5024933d9129ac9baf41a8b5dcd26669317d17e88a24f +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a39d5aae7a5de28bbf7c8e26531da9f7f0cda3e --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d50e6c2130ded251cbd3fb239e3a2e1e0564766292c69bfb4aa6ba0d973844 +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ed6e60e7bb83f755f8cff15c8ac5d9645a3a68d8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a91ac0794c8df701d6f3e4a269198ec3524e68c8d60de35be885c825e2bb23e +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..ab5c6d6372c1f0813efbc937f11c346c8b6eddd1 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35b714dbe5bcf64c23519e024b759057e374014a093efcb6bb5e101ac4e0cf0a +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..16e872bd1c42e32b162cd7f9615cf76e8b97bc4a --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e27ddaca67601bcbad3e3e13b4efa2a89ba1f359556499a0a3535b6a0f8ec9 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..17d632ff0cc683072a51686ae82136bd9bf3766c --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdcfd81a2e81145fe0e988fef364e3dcc0d7616fcae10248ec779a5aeb8d6dfc +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..30f334e3c447f91ccf1d56d31dfc5535ccb7e592 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d6e5df2ddf523f8d35a1d20fd295a230c7c3ebaee2f94d09e14dfed30ce1c6b +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9cd7e74fcf2a0ea87aa0c4faf8c8f1f760042179 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c57a3b3cf6cb5e5bc88337b723e693a6efebfa9b45d7249c2a7c410852e42e +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7893c2bdada22dc74183b942daf81f0c027f587 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3ffcb2cc5e70c67edc89ba6a135ccfc9b4a3b6ac3fc741795f61d4e609297bb +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5b20e7c8f9d266fbfc459db5cd640165f4a721a --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfe9333b2799b5201e8b92513217a74a774f8f000dc5b6b2ea1343e19b0cfc64 +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c3cc8f51774c95da2d04a00dae26dc1bb37354d2 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fa4c023ba4432ba7c975c0e069b908c85c6fe1794ad6c5df5bdf6a0f837c0ea +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..32d6c84640b9c5181af2c0ced464ca7e508f82ec --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:137c232971cf9ff7e3772a58a05faa378e7d7a03b490ffe85b75dc5b9a1843a5 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bac5482300688820d490595749f090f8c0028c17 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdc8fd18fb0699253e7366fdbb45e93b0c7e898e3aeb370349cb9b73d7a1cf0e +size 55408837 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..440d866dd1278c972b786b4df22d786eff740830 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c287a1cb8354345958d71bb25f3eb472b3b849aa5d005d75978912cd87626c9 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..7b64ce07a6db459f58adc38e303e5501bb37365f --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d771d0abf8214b7bc90d1a8fb94b55f8b8e7cb364d3e9e1ae1683996e8d426a +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..8de011467a4a1300d8bf1dab7fb295c703c3d495 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a10c0b989a8b9901787579236642cc66d62131931f677f9a33ba44c7dd323c5 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..d91af25057bc69976657b6e1bd85b2bee78a0ac1 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a12514082f79a768110286feffab8fd0565ab2e149ede72ae5be436d4bd2f20 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b9436ec25aa1cc209848e7ff62a89572ab78722a --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc18814a2ca4c671378dea98d0dc7a00bacf159828ce1e8f08efdc0962ed18bd +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce72654f572f2506f27160b816a295cb0b390c16 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a218931437f4ccf43b090350bb40ee3df136a61635dc16c5ca38673a829c2bdb +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5121d5144d76de26285f96117bc7f1ddbccab8bd --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55dae7c913e1e8f6fb7335c100308fdd01c767b28cbf15aeef36674982f0ebb5 +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..7ad40d40eb967a664d38957689d22d02e91a4fbf --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e26ee9eac765f5af360b33971c6491efba06ddd63034ae70cb1d1032b5c17f4 +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..82d71fa90d799c0b7342c0765fb6762801445c83 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:315fbfbe1b8c5d477c969fe4c6460e7cc8f3fdcb70ddb38b295e2e831fd05eb3 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..eaeef4ef2ba32e85c720fba34bf5ec05bd0ca5ae --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cde560d7183b5a8e4fe46ce47312ca1f1b6fb2bc6da491abbff8fba5749aa21 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..eaf4170f8524a9d235447e9a63ab99d3832efd33 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d959ef8c6132bf1b81da49a826a59c94321341dc8fe5b3d0ef64908bbe6611e +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fed940bed83776fee227b5936c168e6282b54594 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11998cc5f35748b7722fb0b2c7a077a4a3e3b00ac72b4ef20efa3259e7892c63 +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..172b58c2998cb3deaa00bc97961b39095d69d977 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c194a266627428192dd8910884f4279df010be912eaffac85cb0081a22f040 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..59246ebdeaa803ab9b667eaf93b2e0639100ce67 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c05f6c5ebd35d51bdb72c2c16a130a9f255da7be543a4bfc863c67a11223d070 +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..3401fab0998262e9497bd67cf08874393fd68da7 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9998e95a2e46960b01bbdc8695499efafd3b8312678e8d665e4b347a6bfe7c9 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..cea3f10718f9fd2de9dbd11d9beef4d463ce521a --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d29057ffde569aed9a2ffcbcd7a9ef31aa3cc7cc97a3efd47800ed757fe766c +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..47e0773e3dcce197215ccbfb73f8fbbd49971fc3 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4efa9675a6ee16989017ea282a5b5d777a8a43aa0da245173b95fc56db0368db +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba0371866ff4c56375788d8e6b6ac204eca2f3b8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c26f336522cb69594b3952d10c9ee7899a17aa4a8eeeb9d1b384b971fa4c183 +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..15d322423f03d36113221d46049fc2619d0a0c1a --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e49c6de292fe59e58372c262351a4253e6b055950e3605be7c206d16eac0e98 +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f5a48ebf8f0c4df77fe80a999f64ef0c3df401f --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9ce2acc6c23c4078447d4c2076006a047a609579b9d2f14de7edaa7bdb5fd1 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..ecb0d714f9911d75746f7ea1ae96355cd9ea9d08 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1318aa7189aaed7148cdafc33991ef232c5026dd5d6bc2f55bc52cd5757611ac +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..1fd4007def97b85f6166d7a60a3e21a9c5b9f7c3 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b3bf5df0215fca99656361e287b3c1f1cadcef7a3e0b9636105adbd417c84c2 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8718467d126ce6bdbd53d0dbdd54da4de1ff11bf --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d2ef8130fc98df19a3863a629f0a8a22986faed3b54d90a56462143208d671 +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..111ccb0d6e421cf3485e650ba4d02a90f35a7f3a --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82dcdca41f4ee0cd1781212dfd61017d581870be71aab335f4c717a2a597545c +size 55408773 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..f793713b25a3ce63de1b7614e69292deacc9b70e --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a54d2849f8f07654e383a8ee6ab76aabf329ff3421dc302d246c9a873096193 +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..9a6e1a363b96e8bcb5bca9d58a240ae4f76e563b --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6306b2f49b245e12944fdf0a95f5fdb503c185fb2adab2a1f3b114360cdb290 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..07d104858c4cc6847201257811996b6612697292 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88c33b2d2304a06390632a67a1f7565d8a8dbc00c0112a19be288b5332dd96ba +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..d9ce7c621d3a5375a96d5217dec6c4b1d6eb43cf --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:116d60548380a902bb1ef6673cca21849a3f93fd00dcaaaea28411d931535935 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b4ecb0ccba616e482f4a3ec4b8e0a53368e6fbf --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfb7bfa2c34c711580edf233de0f324b5ef962a780aa91f27b4eb576e2588ab +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/adapter_model.safetensors b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4c8dfa04ae72252d993d34cb5d559c332c89bc6a --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d783f5edfc4480933a72088cbb07fd12fadb9b0093287a33949f461c69ef3686 +size 36981856 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_0.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f247d3f288fe2df2bf83c2c0215acbb627eced3 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d28321726bc471b4edd01dc18fb8e63142091ce4c621b9911a529303e9bbf705 +size 15365 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_1.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..0fb058a6821a6dd1196425731a9176dc855ddd2d --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3f293e7b160532f9a2c9cbdb99bf7e7c6d66ac80d1c5446a83496d763e69376 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_2.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a8e98115159494d962191be83feb49efd13df4eb --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71da3e58edd1782c54291e928b880dd178ceb8dab179eebfc4ca0357dceeab65 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_3.pth b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..cb8288df06f6d46ac39ec100acb5019f9b82bca6 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9488866fbc8d2daadf8f124e50ccdc492c56e533d3a680d9c29928125e90174 +size 15429 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/scheduler.pt b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eb04204506c94bd661dad83fc4b7f80d132d458 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0745cbdd2c0a3caae7131e38e031d01350e2e6b8404ec309e908eeec7592a96 +size 1465 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/tokenizer.json b/dapo_lora_qwen2_5_3b_20251129_022228/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_lora_qwen2_5_3b_20251129_022228/training_args.bin b/dapo_lora_qwen2_5_3b_20251129_022228/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ef46f35127e9f6f00200bc2417ff10aaf2e7c8 --- /dev/null +++ b/dapo_lora_qwen2_5_3b_20251129_022228/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4934408abe1007a252a69d5ce6748ee48861a0e904d53901a1aa856adf4e14c6 +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c3e4fb8eeda7e4139c4f0471e3aa2b04de58011a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a86a77fc531590869b380b97be8fcad5a5a18277bcce3fc055fdb31e67de1d43 +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..dc1b5cc3e7177b20c2161f2e34d12ca18e7986a3 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9ff0ef8955c12282aec1f70008da86ff4536ca85c59d00e39b65ffcd14c0ef1 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..74cf9e98d8a233c3715b44602825fc132dddb85a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27e5858d9996b1854b1341f2ec17e98d5296b5eaffa8fa9030f717966b307002 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d91d84ee7ce6fc15f8af630d20f12aec7f58eb --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a000cffeb82f679c5eea33f850666a8c70d17499ffc7879cf41417a213f90c +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d09b8210d74252984f8e4ac2359ad5d598a519d --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1ea4e3cb0530b7d09b5cad27f01df3c551b541aa42ef4737415166a5625a4a +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..783f60a0a9b54b3328e293ee1ef63b508a82cbc2 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8307c9b7f97f69f698b68269479f250717d1dd7dbd735a052b7c853aac4afbd7 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..34f8136a8709a963bc582833bff30449c931afec --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3b178326b6060c2bfa9697a5b1a7987e8d6f39b832a395c278a9532c6a226ab +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d08ae64295b57090bbaa5d6676253533d838873 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a72d1751ecd37a23ecd20bd8b9260f394c2f370cb5db8d203bad7d01395f4fb8 +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..2efdba0c8990292ed841d91849ac0f3d63bb33ad --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c73ac2d5db8027d7db6748ddf1f26d0e9d3e88d07d316b168eb63db88c96289 +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5675823eefc48bca956726e212af3c081d5b2723 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cecbf4c5b68cc0da07f534e153789d2ea9d18ac9a3a8a14f8edddd0ea181585e +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..85bfd4f10ed32a6173d6f52cc8f5c918a600cb7a --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2c686a8bf2789487c29c31b2ef20160cb3ecfe781a6df0838a6b4e92f07647a +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..1316dcbdbc387ba5ad4cb72c9d11c48881af6187 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7158e21ae4a1156220ad310ab00979254f0158ccdfc4a8686fd100d0422bf7 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb4e8900ca74d271df161df3e78c5e3163d3ca2c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac63e93328a0491bc31c5b67747712626467b0c1fab68bd8f3a90d2ffc2d318 +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c67dca8b843741915321dcab82bbf7ea97c479e0 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f92f7cdab7be9885b9c959e1628646e6c3951621ede131d5ca90d55a8107139 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad0a5da0642b8c0dbbac258e05d0d9b7c07ac731 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/global_step256/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0b50628a248c301a7c061697547831f54666223ccea2be4421abc6557a0fd61 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..f8a5e458f68563ad9166120d151f8441fb42de77 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a11e9f5316d172664aefe72ffa04513a8646696d441fd9d21f32b4404c0e632a +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..bd303d356789aa89e3942c18d9dd5a7888d94d19 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8af01a16fe4edcb47e521510c475077abf4f16e6174c666575df5f00bbbf0c5b +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..1fe2b4b3301c0c909ce50e8b0024c45c544759d1 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:322d9052deb4e29617e899a8f300e3dedceaa10bc8b1bac576ce41162f21f802 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b9d2b8fcdb09af679afd66bdc3fb62ada4452d33 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f35250122a647adb9e9fcb34d4e395727448aef414ac429477d12dda43d576f1 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da175406e5951634027623c46687436be96a222 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8495f527d2ae384d255f961a1b604892e1f5459d17e99146a7b64167ecb9365 +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5af8ed1713f50c582565a938b7aa7f9a158d49b3 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/global_step320/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ea245a640ac3a1bfaecc0c3d458b04022ac54efe3b0f0495990ca51709a6566 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..84c3523197ff10a71acb7bc9fce0161f589c199f --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06985dc773c540d2bfb9876ba0600c2b5904c077579fa1b8957d75c801b891b7 +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..8c9fa119f80fed09494e7df7e52e0fcb5ab83887 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df1dec6070cfde03e21d21bed49abc4d5777afdff918e89d538ddbdf6ada7f86 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..7a58b8eae4650875594f4852403793c4788d1811 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df415f01f10a662b1a20cea5cde49b7d4283a704ff51f0bbae9d331eddc024e +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..c1b849200b8eaee38b00e323d510cc7cbfb8f765 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52bf598c7076ed5ae467b865f74e7ab827e0f1ae899b3bfe4350387fc1f883cd +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b635ce1666c50e816d388484f117d6c351b92d3 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da013ae0b2b98d7666c2dc2fe7c1c09f26c72a818d58bd9b5b49a1d1f432bd5a +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85637dda1ccec42e1d9e6e9fa96e8048df5419d0 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/global_step384/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c47b5ce31dc5b6a84d04157a02c90cf62c1984255b38e7142693723b087b5db +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..53df5872ef2595082b7f0cae87b870caceb68288 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c0dd6f7380e8948a2d24ac5fe9a23b769dfe6bbaedfce33effa5883fb5189d +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..1b2077da9e91317fa7438312bdeb54d12586e9dc --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29537953c0d4cc87f3c26ebff2f231c7d6dc4211bfc88647be77a110f33255ca +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f3f7f5b04084713adea9b694fea4fc9005edf74 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6545fe78510057f88e9856705c36f59609b9876a243e9c5ca60ece9b0daf14d6 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..103a8b7fa82ffb046beafe54847c7b393452b58f --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d66d948baa83521f50271acd3c3bda2b4e825af193af205e614640cfe72696b3 +size 55408773 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c002e692d022f9ba55fefc85b22de1b76b666f9 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/global_step512/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8050eb0a0407cd567071f5752ab0e4b1569256d19731df7fa4e91ce07ca0f0e +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffe2824813057abb5f9e1d5bdf8ece469d9a6af1 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/global_step576/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:622af3f823680f0597d7354d8b8c6ae5bab8e677714c14857647689ce132e0c5 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..d60d0316f6ce9b81f75c64992f65ac622c9e87a0 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5f8dea26648b496ffc946e233a6e7699e1295d7c7fdea269ed2102a1d86b765 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..de90a5d940b70142bd2500aeef06dcf3e0768280 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90a7ed834524b5695781dce0b0a908b5247039565042a6d49df73637f8e2e448 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..7e9f69f44ddbdf4a698e695b8f3d97fa0c0972f6 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0423ba3279c4971b11bc329afdb52310ef434cbffc05f906712b8a897f3bc085 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..5c4834f685a59e51c45da21b5dfdd7b445d59460 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8914f973db19534e42abc820f54787fa0c23fa8da74fd7113efb7c2adb7dbe2 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..60375cfbd376b0431001ffe5c84bd4d584101cf3 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a01726d2f367e26dd0fc496fb96826a6e6e104457c056f87cc55dec29a226e8a +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/mp_rank_00_model_states.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..721133b034a9a34cacd28fde17a96ac081064df7 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/global_step640/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa5de89bbc8a5277c9fbeb579462965569dfa55720726e7e496fb6ff13f8445 +size 37231769 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef58ce6110544227be7c46fb3e22e1c3133f8f56 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70c517b0274f4b25bbc095472066ccb08f546081ee806a07abb0c52ecb64ddc6 +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/adapter_model.safetensors b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53a1d60b3bbf97ebf77d8a87b5361858bc309f3f --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa8cf44842c1141e6bab9baa0de5394f0ac90c9a713c49018c0150d15e1774fa +size 36981856 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..7799abbba2f315339bc75fe16a7cc48f2d4098dd --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b516c58ea6ef8aaf72f6b70eb8a556367d794edb11724ed47c56ec58a61f54a +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..939b9b4016cba829a3d9efd48a38ece173b8a113 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceb02a34cf26846ce78c036ab013679dc726a5d13d8e2f9085bca9e7d950a3d9 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..43510a5dd770991ca3034451d6baccdf737442d6 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:845c03b2fd51d00f60339e7092d9709c359a8892453f6c931020f92b63690f45 +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..e1a77d836a1ffe13f7f699767c5270e32850724e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbf0acaac98ef135c9f5cdcc387eedc31d62dcb712317bca36268a611cc40e9 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..fa2cc0ec753e282e0c1c51c676b9348dd73ed61e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a183d479371447a6cc4d0e3bbb9766cb421aa5ab497d8ebec6853b4768b3ee0 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba0371866ff4c56375788d8e6b6ac204eca2f3b8 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c26f336522cb69594b3952d10c9ee7899a17aa4a8eeeb9d1b384b971fa4c183 +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d02384e19d1483b4147b625da3ecd59ec1dd358d --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c171501c8c4040b8bda7bd8bc8ae3d73e992d9e5f0ce90ebf1a6f1ab2cd716a +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..d59af1d14bd6bb8beac363905bd1ab54da1a04cd --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b1699d61af1da4d67aa783226a1a264e215fa4ef845f0dd22bf211a7fa79cb +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..9bbea3d6e3f17951a74ea471e24f686848128279 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9734ab28d62b36d81a8bf4178e928599c2e464e01b9f89826d759aec9f8a357a +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..895c260fd7fca551f519b4f128bf68f6568a5610 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb2981cb524c1339a382d54869e58f4f44793e36ede98d8065ec2a9e1bdde66 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8718467d126ce6bdbd53d0dbdd54da4de1ff11bf --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d2ef8130fc98df19a3863a629f0a8a22986faed3b54d90a56462143208d671 +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..caee91afabb099795784c980a183dbf029c78091 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65b6f0b37579b2fc732cf5a250459b43036e2efad796994a7cf40fe84f30a7b5 +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..320879190031d993b4d81cfc0fe57a9debd45860 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22f73c8379b6e361c5018b1067c0687ed86d5c4ceeea2f992e0d285c1aa4a902 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..4e14fa95efc1fc739a70d1c0dd6564c5fac61d58 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2d00657f466f400d334cc8661a6b9624bec9f2778caf33fdd349e1d83649c6b +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b210bee5496abbc52a68c46ff037ea5f5bbf7eb2 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59e46d387f99855e298a36d3f5a379eb9fef99e1251d091df2bc4e0b2a10a6b3 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b4ecb0ccba616e482f4a3ec4b8e0a53368e6fbf --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfb7bfa2c34c711580edf233de0f324b5ef962a780aa91f27b4eb576e2588ab +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_0.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..8146c980e72c499f8eb94d884151c328277a85f4 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62012f3790fb7c9d5dae43463b6f86f8233d0618155e2166f1e6f2d6c3b354d +size 15365 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_1.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad73d2f1de442d359cc7e6a72c02b8c0a79c4cd3 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2eb78d0f42da2ac10998c8f328729160291e9d7448e1e0a8c5e01c924070097 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_2.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c33aeb025d2be25e01772a6b8b0a0e7a4b517b98 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:776719d14871ebcac53883059aec98a97a3581308d81e57f45748da08fe322a6 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_3.pth b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..86ddb32828a8459a848ee5038e2b33e6b3766bd4 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b4eb6f51b705a4a9682fd8e3e8e9973e5c966879d27614735052703863f615 +size 15429 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/scheduler.pt b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eb04204506c94bd661dad83fc4b7f80d132d458 --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0745cbdd2c0a3caae7131e38e031d01350e2e6b8404ec309e908eeec7592a96 +size 1465 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/training_args.bin b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a32527c071ce3323255d067df17ab72b228551e --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc479e21276b308c8f336b99be02d5fb11c440dea3134eaff10d6dfd8a99cb +size 8849 diff --git a/dapo_lora_r16_qwen2_5_3b_20251124_104900/tokenizer.json b/dapo_lora_r16_qwen2_5_3b_20251124_104900/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_lora_r16_qwen2_5_3b_20251124_104900/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_0.pth b/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..41cfbe42c4491352e7c2b6f0aadb7aca23891ec4 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50e736f68ce66e419bafee1470e16a29fe2c923a763449dc89288fd79863fd26 +size 15365 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_1.pth b/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..8edeec36004f61699b84457bec0e057ad4a99c4d --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dff7119324230b0d598a06a9b09cbb29c60876d3db3f08e051162b8caf28044c +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_2.pth b/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0104924759fdbb51a48c3271c53354066bf4287e --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f56ca6e4a6d86739463fb9cea62e456f640808c74f72cc7944ba80b4ae799a3 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_3.pth b/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b2628e9b2d57e99b8a703191967904bcf87f9b18 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53c97b22a54e5d80480acada09bbaf601d7704454f3ab881de6910419daa0ffd +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-1024/training_args.bin b/dapo_lora_r8_20251129_135342/checkpoint-1024/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..489d1fc6a9879879650b9a0275141e44deaac832 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-1024/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e591d12c15a6576f59af6858dbccfa77b59d60b21ef7a813c92a6711b9106af5 +size 8849 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-128/rng_state_0.pth b/dapo_lora_r8_20251129_135342/checkpoint-128/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ea58d1827d81871a3025db0ec1f4c7ff5509762 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-128/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9696394a2ba0275d1cea6c790c677675eb24731c6c02dcbd5923302540035f88 +size 15365 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-128/rng_state_2.pth b/dapo_lora_r8_20251129_135342/checkpoint-128/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f2b6d58395b6b609571fab3dbdaa848dd5daf55f --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-128/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b234788a7cc4f78dc3bfab3f2b1ecc4815d81933b105b1c9c6c90c3a119e4d0 +size 15429 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-128/scheduler.pt b/dapo_lora_r8_20251129_135342/checkpoint-128/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d08ae64295b57090bbaa5d6676253533d838873 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-128/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a72d1751ecd37a23ecd20bd8b9260f394c2f370cb5db8d203bad7d01395f4fb8 +size 1465 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4d8fdcd0be05ab5225070ed40f98d533adf3f30 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaaee58116d0f10d34164ff27d6acf62c6764f75f94d18b5856d00d361aa7d83 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebeb85c6617b3d8c83889e1551444b2b6cc68774 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cea82a90dae8c6c18092b71de98c8aad7333133de909fcf1d49cdc0c9e5d251 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61ef5c801576992c82e9936752f5db5a892fab19 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-896/global_step896/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cad3f0a2f4089f34e01ff3e47697b976411f35e5583e19e05b292d5b9fb3eab3 +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9c44dbde9eac7235b86ca2a754d2df76f9d5998 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98a80fb8813c5fb8472f01bd58e17797d686dc6d3b17928f0b6d4495b43d3248 +size 27711557 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a50a74590ceacce703726e46e6c36a59a9ca7fbc --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb030c11cd837d9dcbe3795f75c95322a9c6c2cafc4c839d4cc7bfdbb0422c66 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb8120ad4e1bdc05f076f6e673e1d67f2ff7b9b --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db19b406fdb59dd8f3763a7ff0725b1a6b281f62600a43128ccba10f11c3f541 +size 27711685 diff --git a/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/mp_rank_00_model_states.pt b/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..210f8ba8a3336ef1d49a7da5bb1155a3de8fb6dd --- /dev/null +++ b/dapo_lora_r8_20251129_135342/checkpoint-960/global_step960/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62865e5f1165a9e420c77d5be0669d20bd3d09953b64cab14a860e83d66aa338 +size 18767001 diff --git a/dapo_lora_r8_20251129_135342/training_args.bin b/dapo_lora_r8_20251129_135342/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..489d1fc6a9879879650b9a0275141e44deaac832 --- /dev/null +++ b/dapo_lora_r8_20251129_135342/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e591d12c15a6576f59af6858dbccfa77b59d60b21ef7a813c92a6711b9106af5 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3dee4cd6c8d7c2347ddc633f99eb0d78502ebea8 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef81f07eada542b0beb31271a437a008ad2819bc79b587c749041f1b940e7dcc +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/adapter_model.safetensors b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3dee4cd6c8d7c2347ddc633f99eb0d78502ebea8 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef81f07eada542b0beb31271a437a008ad2819bc79b587c749041f1b940e7dcc +size 49582616 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..707d1d59973e5a17b3054910781fd56c2b6d6a5b --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82dc67fa4e790caddceb4fcf31baeec15239662cc6da3ecb8a8ed77c84c02d8c +size 49768921 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_1.pth b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..b0c3c8b22069abfb4133ce899de8c13ee1183a2f --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:713555d67a7659e632a8a8703416a26ce646cc7cef929785f352142190698188 +size 15429 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/scheduler.pt b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eb04204506c94bd661dad83fc4b7f80d132d458 --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0745cbdd2c0a3caae7131e38e031d01350e2e6b8404ec309e908eeec7592a96 +size 1465 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/tokenizer.json b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/training_args.bin b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..28b57c2433d1f782fd9d6a2d566eacd7c01306ca --- /dev/null +++ b/dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e763c53379e58f5e941c941cb9ff1e9ea6ce682340ae670fa6af4ad661a269 +size 8849 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_0.pth b/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..fa22c5d9c995fb1b2402c884ba48d4d2b4fa1a9c --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:481c25db9999a5e1478e8023d88246d776000d460151cb8092c88bf239f71393 +size 15365 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_1.pth b/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..89e6fd5c9373c1a5631ee43b4fc4dc213d094fdb --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e7a6b7223617d92c2bdf4dcccb0de3dfac491d0138490120e74a8038e9dcb51 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_2.pth b/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..9e9efb25ffdf8d532a07ab74843aa110f6d8d7fe --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa52e36cbfcc87ab95efa1a1863c66c29d5aa8544dfae7f70e10f050f9c27921 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_3.pth b/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..57832b383285259e89a31543b2cf56ccc715ae29 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-1024/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73bb1bc19fcc85e9609261022a1603b9ff3b657c64ceb8ad8e2dd0ac5e65c24 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-1024/scheduler.pt b/dapo_miss_openmath_20251129_124147/checkpoint-1024/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d91d84ee7ce6fc15f8af630d20f12aec7f58eb --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-1024/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a000cffeb82f679c5eea33f850666a8c70d17499ffc7879cf41417a213f90c +size 1465 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-1024/training_args.bin b/dapo_miss_openmath_20251129_124147/checkpoint-1024/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..4aaf77970b3dff8064090e296d624d3538978ae9 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-1024/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5c215d84703cfc98ad11de2d9f07cdf4b5dc3343d7447f227ef9ac39f64c06 +size 8849 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_0.pth b/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d2d76c7e1d6460072528041d39a663e1953f5ab1 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95b459995005d37a68cc306b2352b3fff82d378a1b8ad5647ad1befef99c10e1 +size 15365 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_1.pth b/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..da6b30aaa1e39fa9fe0ba525d993b6e8e6780a96 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72f1e8244d687931f482c9c12841eaa066448a09541a616aac6a5e3b9a11828e +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_2.pth b/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..7b57dfd75ad9f4e9dec4cdb6719bec50b98011a6 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64f1bf5be50b440a4df0e2a6bef587684b5a12cfe57990dbe38bdddbaf7099aa +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_3.pth b/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..155f6f5d86d68ea7a66494dca2d346f0783b34c1 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-128/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61739aa59dd374acb6c6fd9b55a50848cb6fb038349892d16e913d581ca16231 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-128/scheduler.pt b/dapo_miss_openmath_20251129_124147/checkpoint-128/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d08ae64295b57090bbaa5d6676253533d838873 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-128/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a72d1751ecd37a23ecd20bd8b9260f394c2f370cb5db8d203bad7d01395f4fb8 +size 1465 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-128/training_args.bin b/dapo_miss_openmath_20251129_124147/checkpoint-128/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..4aaf77970b3dff8064090e296d624d3538978ae9 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-128/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5c215d84703cfc98ad11de2d9f07cdf4b5dc3343d7447f227ef9ac39f64c06 +size 8849 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-192/global_step192/mp_rank_00_model_states.pt b/dapo_miss_openmath_20251129_124147/checkpoint-192/global_step192/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00e4d15c2e9dc66ffcbbe9d91027be122e3675d2 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-192/global_step192/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fb4b48ff92afca09161c12b050b99ada721b2924d943534db5958e099133133 +size 503979621 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_0.pth b/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..8c610a9c45c8276ef733e8a6d928fe7e9fc79594 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54cf8d9b60ec8f7f3af441672fd8cf8aa71310c6650f7b47d5cba25c45e694b +size 15365 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_1.pth b/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..4c878e6c98aff8858da71722dc7957ca2d63f941 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc4cf5ee91757d6c3a32c93905509bda025154fa00f2f24a7652dfddec4b6c96 +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_2.pth b/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee3eb2ae81fdc91c7e41b882dcf7da6a7c25604c --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1220afda81f98ae75ab016f763139c9c71c3ff79c0aa0d52895ff0fdc96b7d4d +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_3.pth b/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..c6b6c26e4b9f4c1904419ab8cb457011a954c9a6 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-192/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f905c06b77fcf55a96820668e1e0ef5b166bf2f04b5d9852afb33d3646c81ae +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-192/scheduler.pt b/dapo_miss_openmath_20251129_124147/checkpoint-192/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb4e8900ca74d271df161df3e78c5e3163d3ca2c --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-192/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac63e93328a0491bc31c5b67747712626467b0c1fab68bd8f3a90d2ffc2d318 +size 1465 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-192/training_args.bin b/dapo_miss_openmath_20251129_124147/checkpoint-192/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..4aaf77970b3dff8064090e296d624d3538978ae9 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-192/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5c215d84703cfc98ad11de2d9f07cdf4b5dc3343d7447f227ef9ac39f64c06 +size 8849 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_2.pth b/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..1f08c2093d616c1f6c4a0a6cffed10bb5a442eef --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-256/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97f8dc1a85e1518c0ef85109246d4d9e5d4d661c63b7076193838581fca9b5ae +size 15429 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-256/scheduler.pt b/dapo_miss_openmath_20251129_124147/checkpoint-256/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da175406e5951634027623c46687436be96a222 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-256/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8495f527d2ae384d255f961a1b604892e1f5459d17e99146a7b64167ecb9365 +size 1465 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-512/global_step512/mp_rank_00_model_states.pt b/dapo_miss_openmath_20251129_124147/checkpoint-512/global_step512/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42b4540cf9878d99decc7d886dcd73707886ac48 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-512/global_step512/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c91f47f2622f940f12c4b61eb2495d9bf94f5c64c3f48b3b4b98e4b36303417 +size 503979621 diff --git a/dapo_miss_openmath_20251129_124147/checkpoint-960/global_step960/mp_rank_00_model_states.pt b/dapo_miss_openmath_20251129_124147/checkpoint-960/global_step960/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14c1a8eb77500ee17c14059c335596173808a97c --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/checkpoint-960/global_step960/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1751fc3f739474accf29dc9ad65aae2b5db8b653a78cb9827fee72f3a3e9980 +size 503979621 diff --git a/dapo_miss_openmath_20251129_124147/tokenizer.json b/dapo_miss_openmath_20251129_124147/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..51ebb3ba93988c73bbd83a3c163a14343fbc5b06 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/dapo_miss_openmath_20251129_124147/training_args.bin b/dapo_miss_openmath_20251129_124147/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..4aaf77970b3dff8064090e296d624d3538978ae9 --- /dev/null +++ b/dapo_miss_openmath_20251129_124147/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5c215d84703cfc98ad11de2d9f07cdf4b5dc3343d7447f227ef9ac39f64c06 +size 8849 diff --git a/dr_grpo_lora_20251129_132413/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/dr_grpo_lora_20251129_132413/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89d592ac1ba80281112132254f1a795d1c22190f --- /dev/null +++ b/dr_grpo_lora_20251129_132413/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7bb39bc9f2d32dcfe646f068c93c2b752e0eb61b187aefdd70b6dc55eb5d0b +size 55408773 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/tokenizer.json b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/training_args.bin b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..aecb99b3f26384aee356780c931fbfecb9e94e92 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe5b31134a094422fde08c9d7fd4c7b9deb533ab123345f5a4814519decf5bb +size 8849 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/rng_state_2.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..eb32b62dd5fbaa74bdfc3fe720ab19218cd701da --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f7dab561c9f5e7cc9cfb34dcc558820c625f058fe107bdaebe989e28ac42e09 +size 15429 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/tokenizer.json b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-960/rng_state_3.pth b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-960/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..ba8c0dc5d395c2f75a48615afed16e0823403524 --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-960/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f2c99c368169e26ffbdedf3c85f300d0e254f3f0c79af06d1f2e894222eed98 +size 15429 diff --git a/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-960/tokenizer.json b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-960/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/grpo_full_qwen2_5_3b_20251121_111716/checkpoint-960/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778