MikaStars39 commited on
Commit
3ce9525
·
verified ·
1 Parent(s): 68d6741

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +25 -0
  2. dapo_lorafa_20251201_161746/checkpoint-128/adapter_model.safetensors +3 -0
  3. dapo_lorafa_20251201_161746/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  4. dapo_lorafa_20251201_161746/checkpoint-128/global_step128/mp_rank_00_model_states.pt +3 -0
  5. dapo_lorafa_20251201_161746/checkpoint-128/tokenizer.json +3 -0
  6. dapo_lorafa_20251201_161746/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  7. dapo_lorafa_20251201_161746/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  8. dapo_lorafa_20251201_161746/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  9. dapo_lorafa_20251201_161746/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  10. dapo_lorafa_20251201_161746/checkpoint-192/tokenizer.json +3 -0
  11. dapo_lorafa_20251201_161746/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  12. dapo_lorafa_20251201_161746/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  13. dapo_lorafa_20251201_161746/checkpoint-256/global_step256/mp_rank_00_model_states.pt +3 -0
  14. dapo_lorafa_20251201_161746/checkpoint-256/tokenizer.json +3 -0
  15. dapo_lorafa_20251201_161746/checkpoint-320/tokenizer.json +3 -0
  16. dapo_lorafa_20251201_161746/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  17. dapo_lorafa_20251201_161746/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  18. dapo_lorafa_20251201_161746/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  19. dapo_lorafa_20251201_161746/checkpoint-384/global_step384/mp_rank_00_model_states.pt +3 -0
  20. dapo_lorafa_20251201_161746/checkpoint-384/tokenizer.json +3 -0
  21. dapo_lorafa_20251201_161746/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  22. dapo_lorafa_20251201_161746/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  23. dapo_lorafa_20251201_161746/checkpoint-448/global_step448/mp_rank_00_model_states.pt +3 -0
  24. dapo_lorafa_20251201_161746/checkpoint-448/tokenizer.json +3 -0
  25. dapo_lorafa_20251201_161746/checkpoint-512/adapter_model.safetensors +3 -0
  26. dapo_lorafa_20251201_161746/checkpoint-512/tokenizer.json +3 -0
  27. dapo_lorafa_20251201_161746/checkpoint-64/tokenizer.json +3 -0
  28. dr_grpo_lora_20251130_192918/adapter_model.safetensors +3 -0
  29. dr_grpo_lora_20251130_192918/checkpoint-1024/adapter_model.safetensors +3 -0
  30. dr_grpo_lora_20251130_192918/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  31. dr_grpo_lora_20251130_192918/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  32. dr_grpo_lora_20251130_192918/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  33. dr_grpo_lora_20251130_192918/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  34. dr_grpo_lora_20251130_192918/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt +3 -0
  35. dr_grpo_lora_20251130_192918/checkpoint-1024/tokenizer.json +3 -0
  36. dr_grpo_lora_20251130_192918/checkpoint-128/adapter_model.safetensors +3 -0
  37. dr_grpo_lora_20251130_192918/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  38. dr_grpo_lora_20251130_192918/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  39. dr_grpo_lora_20251130_192918/checkpoint-128/global_step128/mp_rank_00_model_states.pt +3 -0
  40. dr_grpo_lora_20251130_192918/checkpoint-128/tokenizer.json +3 -0
  41. dr_grpo_lora_20251130_192918/checkpoint-192/adapter_model.safetensors +3 -0
  42. dr_grpo_lora_20251130_192918/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  43. dr_grpo_lora_20251130_192918/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  44. dr_grpo_lora_20251130_192918/checkpoint-192/global_step192/mp_rank_00_model_states.pt +3 -0
  45. dr_grpo_lora_20251130_192918/checkpoint-192/tokenizer.json +3 -0
  46. dr_grpo_lora_20251130_192918/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  47. dr_grpo_lora_20251130_192918/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  48. dr_grpo_lora_20251130_192918/checkpoint-256/global_step256/mp_rank_00_model_states.pt +3 -0
  49. dr_grpo_lora_20251130_192918/checkpoint-256/tokenizer.json +3 -0
  50. dr_grpo_lora_20251130_192918/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
.gitattributes CHANGED
@@ -270,3 +270,28 @@ grpo_full_qwen2_5_3b_20251121_111716/checkpoint-256/tokenizer.json filter=lfs di
270
  grpo_full_qwen2_5_3b_20251121_111716/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
271
  dr_grpo_lora_20251129_132413/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
272
  dr_grpo_lora_20251129_132413/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
270
  grpo_full_qwen2_5_3b_20251121_111716/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
271
  dr_grpo_lora_20251129_132413/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
272
  dr_grpo_lora_20251129_132413/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
273
+ dr_grpo_lora_20251130_192918/tokenizer.json filter=lfs diff=lfs merge=lfs -text
274
+ dapo_lorafa_20251201_161746/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
275
+ dapo_lorafa_20251201_161746/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text
276
+ dr_grpo_lora_20251130_192918/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text
277
+ dapo_lorafa_20251201_161746/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
278
+ dapo_lorafa_20251201_161746/checkpoint-384/tokenizer.json filter=lfs diff=lfs merge=lfs -text
279
+ dr_grpo_lora_20251130_192918/checkpoint-192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
280
+ dr_grpo_lora_20251130_192918/checkpoint-960/tokenizer.json filter=lfs diff=lfs merge=lfs -text
281
+ dapo_lorafa_20251201_161746/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text
282
+ dr_grpo_lora_20251130_192918/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text
283
+ dapo_lorafa_20251201_161746/checkpoint-448/tokenizer.json filter=lfs diff=lfs merge=lfs -text
284
+ dapo_lorafa_20251201_161746/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text
285
+ dr_grpo_lora_20251130_192918/checkpoint-1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text
286
+ dapo_lorafa_20251201_161746/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text
287
+ dr_grpo_lora_20251130_192918/checkpoint-768/tokenizer.json filter=lfs diff=lfs merge=lfs -text
288
+ dr_grpo_lora_20251130_192918/checkpoint-128/tokenizer.json filter=lfs diff=lfs merge=lfs -text
289
+ dr_grpo_lora_20251130_192918/checkpoint-896/tokenizer.json filter=lfs diff=lfs merge=lfs -text
290
+ dr_grpo_lora_20251130_192918/checkpoint-576/tokenizer.json filter=lfs diff=lfs merge=lfs -text
291
+ dr_grpo_lora_20251130_192918/checkpoint-512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
292
+ dr_grpo_lora_20251130_192918/checkpoint-832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
293
+ dr_grpo_lora_20251130_192918/checkpoint-256/tokenizer.json filter=lfs diff=lfs merge=lfs -text
294
+ dr_grpo_lora_20251130_192918/checkpoint-64/tokenizer.json filter=lfs diff=lfs merge=lfs -text
295
+ dr_grpo_lora_20251130_192918/checkpoint-640/tokenizer.json filter=lfs diff=lfs merge=lfs -text
296
+ dr_grpo_lora_20251130_192918/checkpoint-320/tokenizer.json filter=lfs diff=lfs merge=lfs -text
297
+ dr_grpo_lora_20251130_192918/checkpoint-704/tokenizer.json filter=lfs diff=lfs merge=lfs -text
dapo_lorafa_20251201_161746/checkpoint-128/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:283a421f3de882f21c05ad122d3ce00a399e1e78a2784de18b9180ecc14ea7e6
3
+ size 73911504
dapo_lorafa_20251201_161746/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a2eeae195a344c01c1aa127e9628eaa84fcc2b4d0d692599b4438c57270c792
3
+ size 61940677
dapo_lorafa_20251201_161746/checkpoint-128/global_step128/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ea176f800b9c859a3d772c31b9b37adb1501da856a61f7c6f1b67d7fb723513
3
+ size 41536409
dapo_lorafa_20251201_161746/checkpoint-128/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dapo_lorafa_20251201_161746/checkpoint-192/global_step192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab7ccff0c1e1d7b9654b8a5ce12899fe6f1ee1bd1d0301a9c41b4a7c6981fa47
3
+ size 61940613
dapo_lorafa_20251201_161746/checkpoint-192/global_step192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bce1ac94be81b53f2c90ffdeb6eecbd1f8b4b1aa978e0b3877a8e18e7e27ddce
3
+ size 61940677
dapo_lorafa_20251201_161746/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:597c8af5f7f3e61510ec6aed27bce76955fa292bd50705b7d6a16d01da8f3fd0
3
+ size 61940677
dapo_lorafa_20251201_161746/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:deb70431aa09a4bc41dc312ed52638cbd8616f99962bca79397815716af6beaf
3
+ size 61940677
dapo_lorafa_20251201_161746/checkpoint-192/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dapo_lorafa_20251201_161746/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2685953f25ca45580a0a2240c0e474b0284e98b827b40503e7e30b2ad6ac50e4
3
+ size 61940677
dapo_lorafa_20251201_161746/checkpoint-256/global_step256/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:536d1471d4523a9a2bfcb4ea617881dbb100dcee33cf9d4bf831553241a9c28e
3
+ size 61940677
dapo_lorafa_20251201_161746/checkpoint-256/global_step256/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00acc84f3d3e9e233ca8d7a4dc417fee41508a797e2dc8917bfc76a09f9e26de
3
+ size 41536409
dapo_lorafa_20251201_161746/checkpoint-256/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dapo_lorafa_20251201_161746/checkpoint-320/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dapo_lorafa_20251201_161746/checkpoint-384/global_step384/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f0a16b9dc17db898bae59c162b3cf419e1b4d861a625f7360e9321fdde40507
3
+ size 61940613
dapo_lorafa_20251201_161746/checkpoint-384/global_step384/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28ec5a68c307c8dc3d371dd2bf4580a12743ce350de361ae4ca47aa7b43dcf4d
3
+ size 61940677
dapo_lorafa_20251201_161746/checkpoint-384/global_step384/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b30d03e1636d9c527541da6df2b8b8938f99af6b4f564b4804aebf0bb51d4a1b
3
+ size 61940677
dapo_lorafa_20251201_161746/checkpoint-384/global_step384/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e98f8d324de72ecff3d649131bd26d9eca61e4e34b4b98399f139515cfb18fff
3
+ size 41536409
dapo_lorafa_20251201_161746/checkpoint-384/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dapo_lorafa_20251201_161746/checkpoint-448/global_step448/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d81e97d15e6fa480cce405240eb50cbc00f44ff50799a592f807550acc67591a
3
+ size 61940677
dapo_lorafa_20251201_161746/checkpoint-448/global_step448/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a3411b520790b93d79a3431b9a460b0ab21c3b82efb5ed2cbca783304c56a82
3
+ size 61940677
dapo_lorafa_20251201_161746/checkpoint-448/global_step448/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c50e55c50763947c54fafa3e9f4cfa5d2102a778471499d23eb168c12217809
3
+ size 41536409
dapo_lorafa_20251201_161746/checkpoint-448/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dapo_lorafa_20251201_161746/checkpoint-512/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10f7c55cfa44aa09f4f50b180fa3d7e8797f46db4296f441c8a732d1eeb599ce
3
+ size 73911504
dapo_lorafa_20251201_161746/checkpoint-512/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dapo_lorafa_20251201_161746/checkpoint-64/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dr_grpo_lora_20251130_192918/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c240fdcf320931983992482f05fc28dcd8e7057793221a852f5b503423ece68
3
+ size 36981856
dr_grpo_lora_20251130_192918/checkpoint-1024/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c240fdcf320931983992482f05fc28dcd8e7057793221a852f5b503423ece68
3
+ size 36981856
dr_grpo_lora_20251130_192918/checkpoint-1024/global_step1024/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e07acf7c70dff5f597da42945c635f0dcbe83e9c20cad54219b26b4eaa55df98
3
+ size 55408773
dr_grpo_lora_20251130_192918/checkpoint-1024/global_step1024/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc8c3357cf78f747dd2d095e7a300086fee44a67ca087d0f452b7c71e11d0787
3
+ size 55408773
dr_grpo_lora_20251130_192918/checkpoint-1024/global_step1024/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cee69fffcac34efaf08ca00b0dc39e4109c8553c40dbe9eddb769876acfc2ac7
3
+ size 55408837
dr_grpo_lora_20251130_192918/checkpoint-1024/global_step1024/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6a395a41cebbc4440326565cfc18c9d244316108fbbeb0822b63966d785332c
3
+ size 55408837
dr_grpo_lora_20251130_192918/checkpoint-1024/global_step1024/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0bdab265c8ccad1a01cd595d8e32176c936efb9e4275b4f29e7973b83c1438a
3
+ size 37231769
dr_grpo_lora_20251130_192918/checkpoint-1024/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dr_grpo_lora_20251130_192918/checkpoint-128/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b1cf05158410591c4925eef68e7b331415e22c8e3d52313f76557f92209b3b0
3
+ size 36981856
dr_grpo_lora_20251130_192918/checkpoint-128/global_step128/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c58b748f37a99ca5d39320b531277ea41c5757d23007fff93812c13e389fda1
3
+ size 55408773
dr_grpo_lora_20251130_192918/checkpoint-128/global_step128/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3818383f1e8759d7a6c01dc368be8eb1ea2866ce62bafcd058312e7ecec7af02
3
+ size 55408837
dr_grpo_lora_20251130_192918/checkpoint-128/global_step128/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fccccc3b9974081797aa6b208287b9a35b61001ae6088cb89bb3b4f646ec373
3
+ size 37231769
dr_grpo_lora_20251130_192918/checkpoint-128/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dr_grpo_lora_20251130_192918/checkpoint-192/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7c7379d4c97ef84b02f0953aff107b17981c88b05464a919bb8f4151481b682
3
+ size 36981856
dr_grpo_lora_20251130_192918/checkpoint-192/global_step192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00ccafad6919abfa42d9b5f98e7965eef1b39a4719c8df5bd45c31835bdda0c4
3
+ size 55408837
dr_grpo_lora_20251130_192918/checkpoint-192/global_step192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b54c1c33a4add084a0c82c5f2fade8abecec34d313d7543185e60451c4cc0462
3
+ size 55408837
dr_grpo_lora_20251130_192918/checkpoint-192/global_step192/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e2de8e7967ddb5fe57e6570bb90bfb20b7ce94bffe878fbf0edef23d0e56589
3
+ size 37231769
dr_grpo_lora_20251130_192918/checkpoint-192/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dr_grpo_lora_20251130_192918/checkpoint-256/global_step256/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca4349cab222a3861072adf3d027587a3d1b8562abb8a3a7f2c46e1256443f95
3
+ size 55408773
dr_grpo_lora_20251130_192918/checkpoint-256/global_step256/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac64546122cf351c42dd2a6691a523e389b9b384eca0ad67b1488e31be8056c0
3
+ size 55408773
dr_grpo_lora_20251130_192918/checkpoint-256/global_step256/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d597a6e90cbf3f4ef078fac0b651e6c0e6544daace6feec9076d1ba67ac05f63
3
+ size 37231769
dr_grpo_lora_20251130_192918/checkpoint-256/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
dr_grpo_lora_20251130_192918/checkpoint-320/global_step320/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f7390edfde28624a3982f286a32cd8761da1fc5a321e9bab5245df7bfddb28b
3
+ size 55408773