Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +42 -0
- dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/adapter_model.safetensors +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/adapter_model.safetensors +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/adapter_model.safetensors +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
.gitattributes
CHANGED
|
@@ -144,3 +144,45 @@ dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/tokenizer.json filter=lf
|
|
| 144 |
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 145 |
dapo_miss_openmath_20251129_124147/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 146 |
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 144 |
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 145 |
dapo_miss_openmath_20251129_124147/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 146 |
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 147 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 148 |
+
dapo_lora_r8_20251129_135342/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 149 |
+
dapo_lora_r8_20251129_135342/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 150 |
+
dapo_lora_r8_20251129_135342/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 151 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 152 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 153 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 154 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 155 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 156 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 157 |
+
dapo_lora_r8_20251129_135342/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 158 |
+
dapo_lora_r8_20251129_135342/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 159 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 160 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 161 |
+
dapo_lora_r8_20251129_135342/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 162 |
+
dapo_lora_r8_20251129_135342/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 163 |
+
dapo_lora_r8_20251129_135342/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 164 |
+
dapo_lora_r8_20251129_135342/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 165 |
+
dapo_lora_r8_20251129_135342/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 166 |
+
dapo_lora_r8_20251129_135342/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 167 |
+
dapo_lora_r8_20251129_135342/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 168 |
+
dapo_lora_r8_20251129_135342/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 169 |
+
dapo_lora_r8_20251129_135342/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 170 |
+
dapo_lora_r8_20251129_135342/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 171 |
+
dapo_lora_r8_20251129_135342/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 172 |
+
dapo_lora_r8_20251129_135342/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 173 |
+
dapo_miss_openmath_20251129_124147/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 174 |
+
dapo_miss_openmath_20251129_124147/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 175 |
+
dapo_miss_openmath_20251129_124147/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 176 |
+
dapo_miss_openmath_20251129_124147/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 177 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 178 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 179 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 180 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 181 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 182 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 183 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 184 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 185 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 186 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 187 |
+
dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 188 |
+
dapo_miss_qwen2_5_1_5b_20251124_220354/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
dapo_lora_lr5_20251129_222821/checkpoint-320/global_step320/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d0af91fa94c1610d26324df519780960ada6a1f27e6c74457200f6f046518b7e
|
| 3 |
+
size 110803141
|
dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e61d560af8f44e44ea55c365f6bda9b655b62fd537dbb8589e58c8acfdd6e2d
|
| 3 |
+
size 110803077
|
dapo_lora_lr5_20251129_222821/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:43782022f1851c42edab18d1c5f754ce3318a94c6cfd07c10589121054d43acb
|
| 3 |
+
size 110803141
|
dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f63a4cf9a2c4463735a8001cb5dbf663a82c5b8dde35de52e313a5098e3d25b
|
| 3 |
+
size 110803077
|
dapo_lora_lr5_20251129_222821/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9858506d5dc9b37ac0934b2c44e6478e6c90de6289e4eab46bfd23dca29e4d70
|
| 3 |
+
size 110803141
|
dapo_lora_lr5_20251129_222821/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d62d43f0589d5a774cc4ba084fae39730c03afd1f6529d10822901c526a1a42
|
| 3 |
+
size 110803077
|
dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46ed58d17dd28520ff467ff12f58d2d6ffc34d7f0447ca1a77dabf050c32daef
|
| 3 |
+
size 110803077
|
dapo_lora_lr5_20251129_222821/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b91cfcffe025fa39bd52df7ae8603e7ecad8c3cf1f02b22594f9a3cc82bdb10
|
| 3 |
+
size 110803141
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae04a994c37693b00f7f962f1f211233e1d17bc520278b5f7a4958b7f6b21ab4
|
| 3 |
+
size 503979621
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c173f80e553c6402b63194adfa25d1ac0bd85953f8851eacf4b695efabb70c25
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:891309f12d74e579d4b2a160b4bcf4d5eb1b9e3c2eb051bce449babdd7f282e3
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35b4acc54f285d39837fb8f3cb7babe474b62f8d0fb7ba77f2e85f6ab7559058
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:73ab8a32b47361d5715d893043ccb60c9cdce6eb03e27dc46e57df0a14eee7ae
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e1dcaf732a948cf7a50f302152165b5104eedfb18a70442b8a65a2166542480
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5226b106ef4399b09158f8718db0429575809b2771b751be8d1420301d4faa1c
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:38f422db28bd7cbbf94455b7c5938c08e9dce26082688ca6f8809dde5cf96a82
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c708ac2a56999d8f95eec4c5b2d5d33ce7d73acc7286f7030deb351ebde2ad31
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bcdda7b81653c64a3b84a47fbbab27e73126c01d4fed3f71f39fc1c70e04e409
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f1c2ee723f342ea0e40518d97402dbb7cfdf3f7ccc7bfd569d7a05c8e52c531
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59195cba6a18b9f10b45eb779dbe7bdb9165776bd5f070345a7a0a43ad769384
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab7b90ad83442282f9e32c7ebe09e8a928bb21d66d37e7395c570ad7a05336f6
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23bdd2fc827e4743510e0a9069ea2ba2cef1f53b7aeb7c55ce1e188f471373e3
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6302e73dc96b08ce363eba908f3a38c4b12517c8e28bf6528ca133fbe579619e
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d7d899edea76ec13fad77022e08b7dc02cfb5d307607eb38cb47d38a3ece5c6
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6d3a85565f7e407cf1e18e6c58f84583443d68f16ae89b64065eb9c96d9027af
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:077819e24822d61a5ffc0643f6edfa4acee55ae1e413ce52e6e70efdb3223c92
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb9777c0e29a8b4c103c903cefe4f99dcd4494f72ebd61c5ef92cb3a0d2ec92d
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc27fe7078af666ff592665254037ef893dfa00270077c5420e8c525c79ea515
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1ea48117ae31f72542f7e44155ace0461b0a39dc2491b588da754676aab246e
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45a4b54b071716e3dff2404aab252f8cfa81dbea9bcc94a255d04ad66e82ccb3
|
| 3 |
+
size 36981856
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f55753d8feebdac46671689cb05e1d8e48d31bde939d461ac8c70529f627023
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23aee3396d9e328d7bf9fedf9567091db8f907f6972d3300008136bf0e26d6e1
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:716d04c8400d2b013030e40f981724b86a2425b7fa36369b7cb081f191300b87
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7f4f5e79e23c9bf656d32fadac7a179aecbf170a85f2a284f05269f2785daa8
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27f2358fc29df07c12d7e90ad7c60b137f4fe0c980c73cac87798c81766d40d0
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:096271c9237df42169929a141b5833bdaef66cde2e12e05a9ab44dc5c0f51cdf
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e2de8b7503c6a435e15ab55b5b622c934c4a965859b99bc981efbc7048fcf62b
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eefb59c1f5dc727ebfeb008094fdc6f7f030a7acdfbe40743ed0fd322e53e2f4
|
| 3 |
+
size 36981856
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78dfe1964501784207ee53c77ba9d42420c1754407a05f140ede870bc0d561c6
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fcc2bf523806805907cc8f8dd2d48095cd4e31978d5884efc96128cf22d76357
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4e83e929b8f8bd2fc20274deff9ae942bd75ecd7155e3d439917128731db6e4
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:945b0b1cb28d1ff18336559320315ab43643ae7b2bcac986d772b63e24323d63
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08a969dd0c97ca0262352193dd09fdd82dbc13e0692879320913fcb45ceee7f6
|
| 3 |
+
size 36981856
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c13ea7f654aaea2a7400b6b97b67af7422538cd27a74da3b0a9a9572f2f1fcb4
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c7d40c938363993b77c30a7f5e374b1f027c14b04f2842c8e72de4eaad6e541
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:132b6fde99a306af9f933041db48f877de556219975ebeb800030db53647aa33
|
| 3 |
+
size 55408837
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dcbc8dedd1a9a23883f111254f5cfefed63c3e2e6aec0233c46317bd32aac6f3
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91fb7ac83b6decc36e431ab48ffdd6a577fc03072ebea1aa0198df2b631b9365
|
| 3 |
+
size 55408773
|
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5926ac5870d3bdaa700fb2db69b0cdc6f662af534dafe10d46c357408d5faf32
|
| 3 |
+
size 55408837
|