Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +68 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/adapter_model.safetensors +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/mp_rank_00_model_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/adapter_model.safetensors +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-128/adapter_model.safetensors +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-128/global_step128/mp_rank_00_model_states.pt +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-192/adapter_model.safetensors +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-256/adapter_model.safetensors +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-256/global_step256/mp_rank_00_model_states.pt +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-320/adapter_model.safetensors +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-320/global_step320/mp_rank_00_model_states.pt +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-384/adapter_model.safetensors +3 -0
- dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-384/global_step384/mp_rank_00_model_states.pt +3 -0
.gitattributes
CHANGED
|
@@ -76,3 +76,71 @@ dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/tokenizer.json filter=lfs d
|
|
| 76 |
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 77 |
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 78 |
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 76 |
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 77 |
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 78 |
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 79 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 80 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 81 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 82 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 83 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 84 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 85 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 86 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 87 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 88 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 89 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 90 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 91 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 92 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 93 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 94 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 95 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 96 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 97 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 98 |
+
dapo_lora_r16_qwen2_5_3b_20251124_104900/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 99 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 100 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 101 |
+
dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 102 |
+
dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 103 |
+
dapo_lora_lr5_20251129_222821/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 104 |
+
dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 105 |
+
dapo_lora_lr5_20251129_222821/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 106 |
+
dapo_lora_lr5_20251129_222821/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 107 |
+
dapo_lora_lr5_20251129_222821/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 108 |
+
dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 109 |
+
dapo_lora_lr5_20251129_222821/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 110 |
+
dapo_lora_lr5_20251129_222821/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 111 |
+
dapo_lora_lr5_20251129_222821/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 112 |
+
dapo_lora_lr5_20251129_222821/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 113 |
+
dapo_lora_lr5_20251129_222821/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 114 |
+
dapo_lora_lr5_20251129_222821/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 115 |
+
dapo_lora_lr5_20251129_222821/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 116 |
+
dapo_lora_lr5_20251129_222821/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 117 |
+
dapo_lora_lr5_20251129_222821/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 118 |
+
dapo_lora_lr5_20251129_222821/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 119 |
+
dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 120 |
+
dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 121 |
+
dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 122 |
+
dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 123 |
+
dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 124 |
+
dapo_layernorm_qwen2_5_1_5b_20251127_195534/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 125 |
+
dapo_lora_lr5_20251129_222821/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 126 |
+
dapo_lora_qwen2_5_3b_20251129_022228/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 127 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 128 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 129 |
+
dapo_lora_lr5_20251129_222821/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 130 |
+
dapo_lora_lr5_20251129_222821/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 131 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 132 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 133 |
+
dapo_lora_qwen2_5_3b_20251129_022228/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 134 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 135 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 136 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 137 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 138 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 139 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 140 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 141 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 142 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 143 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 144 |
+
dapo_milora_qwen2_5_1_5b_20251126_224006/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 145 |
+
dapo_miss_openmath_20251129_124147/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 146 |
+
grpo_full_qwen2_5_3b_20251121_111716/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:17ebbc5e855944009d1140db0720ddd5916113dd3e9fd5a1fd249dd513e84690
|
| 3 |
+
size 75228904
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0efc20e1b84161371a394fd09f5497707cac93ee7ef9264bd043f190ee3718fa
|
| 3 |
+
size 112744453
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a176b2fb7fdb92a42e78601018de78f4ef01901147c1971ca690a8e3a68e59d2
|
| 3 |
+
size 112744517
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b60fcbf8df2c1283ef750fbd8f3ad2ccba6ddc7ef7e694f554147d6354fa105
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-512/global_step512/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a799d79f923f9620e1b5db896d3a63786c2d253c128f8bfa345b6242f769f787
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6ca4e41cd3d43a3404c13226231ae13a8fbed17462ba29367c0f9a3985f67d58
|
| 3 |
+
size 112744453
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de488a16cc358f58e3a483833bfec9b54dbe86c2fa99c7f87b3d71ba358fadfc
|
| 3 |
+
size 112744517
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b04e00548439d26f0493e677f3f2a56ec81b0086de0d9d1932754d3ac989e275
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-576/global_step576/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f5c7d0c13f976105cf458843e8da50f96fec1506c1a2c111059d22c676df6d9
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:588d0528dcf1721b9c635867e2d1cfe931f627c3a4df8e966d7ccb82d6d116d7
|
| 3 |
+
size 112744453
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6e221647db107bb019cc65fa73d2c760445da0950a4dc8457884ce74dfb4ab13
|
| 3 |
+
size 112744517
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0f812a77da6b251eaa706b7de9831badfd7ba47e3aca4b624b31741c704c884
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-64/global_step64/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48048f334fbfb4a83545d251ac1a30fd2f57d4106c8315609df73fcacfdddb9d
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1d7b21880dc152df3ae82f20f46c194b2cd46f3bc7b9ab0737e2abb1f966df9
|
| 3 |
+
size 112744453
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:854c1306d3e4d70e73d6c62f0a4d258ae278b230321989ec3b10a460da459751
|
| 3 |
+
size 112744517
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:077d8a64ec54768845e66be77995226ff4ad1e06820c54bad279ccd0dbcb4d87
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-640/global_step640/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:178a27ca64066d60a723883444e9155bc961a2c0456f987d4488d1aeef34f88c
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b687595595b09f127a33f921ec2a00d8eb8267e6668c2be94b23f2f52a1d098
|
| 3 |
+
size 112744453
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e1e453eebb9abd2f486dea54e0c01631e1c94b56ef77907c7125a91cc446b23
|
| 3 |
+
size 112744517
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b10e4acae0c6c688d2c4ff1fcdfc9b2eabe37fd9f7c82b81e09184c23dc13b3b
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-704/global_step704/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48dcd7d1297bfb30567f306c3ef823e78b84dfe82b5cce8e7a02ce6cdf578af3
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:96880b8a07727dff0f6ed5b8e2664a6f186e9cc69dc69eeb555a435d538e928c
|
| 3 |
+
size 112744453
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bdd10d229e0d02747581cda1f64dbcfa79efd7b30fbe89ad0dede590661fd3da
|
| 3 |
+
size 112744517
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:540acb5826296ee78356dc105d7361b077766ab87ee2a52c421dad80aa9d9d93
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-768/global_step768/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6712a25d20c11d9baa8f92bc31c7e20d4fb7fcc5818a5277e52a8141b3e49904
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4db17ee1efffefe0bc5083301f0128fa597a7c02d94c8fb87ae44c4f75b01064
|
| 3 |
+
size 112744453
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c88af48b8f6dc22c6212f80afda930e4e1505941e035f3fd2fa236e1532792e
|
| 3 |
+
size 112744517
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b192a5934e69615b34f13541bb995523d2d0f1bb187fef2667249c605c6997ad
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-832/global_step832/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8a35f91694a63690e74e7670d1929582fa312c706bfa55f81190982e0e4d496
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02826c3bf16db1ca4e82b9ed35bc089bc0a12b8e66b041077ad39e6e4b8ed69b
|
| 3 |
+
size 112744453
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14c7d4ba1ea576af91abd42919632dbc8ac9e7585ddd3c8b3db50bbdf9d047d4
|
| 3 |
+
size 112744517
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1ecf66f588a293a787b363bdcaa30fb1e7e52f693c73d3ce10ad60b544680b2
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30e2d29b44514e5fcc1a3a1cb23751a1319a3772be9acdf4e9497f2407227bd7
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-896/global_step896/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cef8d64700b4f15372a94c8c621244a6449ff01ab8a276180d4c4b1cd03e44ca
|
| 3 |
+
size 75529433
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dcc580e3b5995c9b0c434fe334ba8615ea24f8f71896c7ee8a0fd81b39832cab
|
| 3 |
+
size 112744453
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6573b1b41d3c5aa24f219ad1291e820b5fcb8cd61607d5a79b4f721bd0d70a83
|
| 3 |
+
size 112744517
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0747d1f6ac256801e0ba754e45f1fcb77ec3de857861515c4be75ab3da308f7
|
| 3 |
+
size 112744581
|
dapo_dora_qwen2_5_1_5b_20251126_115730/checkpoint-960/global_step960/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:523ab8b5c5f5608ab108d9a77a41db62ae043c856cff8ee6b698186da163b3b2
|
| 3 |
+
size 112744581
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60adeea85b30543a79cfc809c3e8f2b9eda7d88111eba2361e9d3920c70a421a
|
| 3 |
+
size 49582616
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26292eaed3365503633b53ef3e926d07081c4bb8d07e8428d713c1171ba49807
|
| 3 |
+
size 49768921
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-128/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d411da0accc4c3694b34f72a497fe636a4d2f83845e9da226d8b0a2a18197ec
|
| 3 |
+
size 49582616
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-128/global_step128/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68d501313a7e70d248b43a67c77c471fa662c4147c206ec975bb9f96b2419226
|
| 3 |
+
size 49768921
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-192/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7e7720a192f805000e8a9f300b05ee6d88da5e073735da202b1ed2524c6db1d
|
| 3 |
+
size 49582616
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-256/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08cc7b0ce5f86bc89168dda412f63c9145c1239b16d5a06ada9fcfd5072bc504
|
| 3 |
+
size 49582616
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-256/global_step256/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06c6735c164d3ee473424f5629db78c870d1ca5667bde0cb87e64ec6c9d639a8
|
| 3 |
+
size 49768921
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-320/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48b0e10e9dff28a5f404a12ff71b200fa684e25b91ff3bbcad00ee998bed62ea
|
| 3 |
+
size 49582616
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-320/global_step320/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c02630efdc328b38ef0279055906e631adb659cb127f9d06d26b241233482c06
|
| 3 |
+
size 49768921
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-384/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81dfeda7c2a446729f2dacfc914d51a7dd1ff5b77a8d2c562c4a433f7f91b28e
|
| 3 |
+
size 49582616
|
dapo_ia3_qwen2_5_1_5b_20251128_120647/checkpoint-384/global_step384/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe8827547ef3296b2db732ec828d05c541bb9d964480bcef3dc422a84dd78935
|
| 3 |
+
size 49768921
|