gijs committed on
Commit
ebc504e
·
verified ·
1 Parent(s): 04a865e

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +64 -0
  2. grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011354/checkpoint-11200/global_step11200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  3. grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  4. grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  5. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_003349/runs/May16_00-33-53_gcn152.local.snellius.surf.nl/events.out.tfevents.1747348453.gcn152.local.snellius.surf.nl.1752330.0 +3 -0
  6. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/adapter_model.safetensors +3 -0
  7. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/global_step11900/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  8. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/global_step11900/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  9. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/rng_state_0.pth +3 -0
  10. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/scheduler.pt +3 -0
  11. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/tokenizer.json +3 -0
  12. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/adapter_model.safetensors +3 -0
  13. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/global_step12600/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  14. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/global_step12600/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  15. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/rng_state_0.pth +3 -0
  16. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/scheduler.pt +3 -0
  17. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/tokenizer.json +3 -0
  18. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/training_args.bin +3 -0
  19. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/adapter_model.safetensors +3 -0
  20. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/global_step1400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  21. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/global_step1400/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  22. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/rng_state_0.pth +3 -0
  23. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/scheduler.pt +3 -0
  24. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/tokenizer.json +3 -0
  25. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/training_args.bin +3 -0
  26. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/adapter_model.safetensors +3 -0
  27. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/global_step2100/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  28. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/global_step2100/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  29. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/rng_state_0.pth +3 -0
  30. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/scheduler.pt +3 -0
  31. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/tokenizer.json +3 -0
  32. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/training_args.bin +3 -0
  33. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/adapter_model.safetensors +3 -0
  34. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/global_step2800/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  35. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/global_step2800/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  36. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/rng_state_0.pth +3 -0
  37. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/scheduler.pt +3 -0
  38. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/tokenizer.json +3 -0
  39. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/training_args.bin +3 -0
  40. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/adapter_model.safetensors +3 -0
  41. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/global_step3500/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  42. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/global_step3500/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  43. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/rng_state_0.pth +3 -0
  44. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/scheduler.pt +3 -0
  45. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/tokenizer.json +3 -0
  46. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/training_args.bin +3 -0
  47. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/adapter_model.safetensors +3 -0
  48. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/global_step4200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  49. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/global_step4200/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  50. grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/rng_state_0.pth +3 -0
.gitattributes CHANGED
@@ -887,3 +887,67 @@ sft/20250429_133317_sftqwenomni-fullsimple-loraopt-1e-8bs-0.0002/checkpoint-7497
887
  sft/20250429_133317_sftqwenomni-fullsimple-loraopt-1e-8bs-0.0002/checkpoint-109056/tokenizer.json filter=lfs diff=lfs merge=lfs -text
888
  sft/20250429_133317_sftqwenomni-fullsimple-loraopt-1e-8bs-0.0002/checkpoint-47712/tokenizer.json filter=lfs diff=lfs merge=lfs -text
889
  sft/20250504_131507_sftqwenomni-semantic-loraopt-1e-4bs-0.0002/checkpoint-3327/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
887
  sft/20250429_133317_sftqwenomni-fullsimple-loraopt-1e-8bs-0.0002/checkpoint-109056/tokenizer.json filter=lfs diff=lfs merge=lfs -text
888
  sft/20250429_133317_sftqwenomni-fullsimple-loraopt-1e-8bs-0.0002/checkpoint-47712/tokenizer.json filter=lfs diff=lfs merge=lfs -text
889
  sft/20250504_131507_sftqwenomni-semantic-loraopt-1e-4bs-0.0002/checkpoint-3327/tokenizer.json filter=lfs diff=lfs merge=lfs -text
890
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/tokenizer.json filter=lfs diff=lfs merge=lfs -text
891
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-9800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
892
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
893
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
894
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
895
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-7700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
896
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-9100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
897
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
898
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
899
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4900/tokenizer.json filter=lfs diff=lfs merge=lfs -text
900
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
901
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
902
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-5600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
903
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-6300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
904
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-8400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
905
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-7000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
906
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-3500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
907
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
908
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-2800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
909
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-7700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
910
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-4200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
911
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-4900/tokenizer.json filter=lfs diff=lfs merge=lfs -text
912
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-1400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
913
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-2100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
914
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-5600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
915
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-6300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
916
+ sft/20250503_210304_sftqwenomni-semantic-noneopt-1e-4bs-0.0002/checkpoint-3327/tokenizer.json filter=lfs diff=lfs merge=lfs -text
917
+ sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-49816/tokenizer.json filter=lfs diff=lfs merge=lfs -text
918
+ sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-43589/tokenizer.json filter=lfs diff=lfs merge=lfs -text
919
+ sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-31135/tokenizer.json filter=lfs diff=lfs merge=lfs -text
920
+ sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-37362/tokenizer.json filter=lfs diff=lfs merge=lfs -text
921
+ sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-6227/tokenizer.json filter=lfs diff=lfs merge=lfs -text
922
+ sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-18681/tokenizer.json filter=lfs diff=lfs merge=lfs -text
923
+ sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-12454/tokenizer.json filter=lfs diff=lfs merge=lfs -text
924
+ sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/tokenizer.json filter=lfs diff=lfs merge=lfs -text
925
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-26622/tokenizer.json filter=lfs diff=lfs merge=lfs -text
926
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-57681/tokenizer.json filter=lfs diff=lfs merge=lfs -text
927
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-31059/tokenizer.json filter=lfs diff=lfs merge=lfs -text
928
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-70992/tokenizer.json filter=lfs diff=lfs merge=lfs -text
929
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-48807/tokenizer.json filter=lfs diff=lfs merge=lfs -text
930
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-75429/tokenizer.json filter=lfs diff=lfs merge=lfs -text
931
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-22185/tokenizer.json filter=lfs diff=lfs merge=lfs -text
932
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-39933/tokenizer.json filter=lfs diff=lfs merge=lfs -text
933
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-8874/tokenizer.json filter=lfs diff=lfs merge=lfs -text
934
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-17748/tokenizer.json filter=lfs diff=lfs merge=lfs -text
935
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-66555/tokenizer.json filter=lfs diff=lfs merge=lfs -text
936
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-62118/tokenizer.json filter=lfs diff=lfs merge=lfs -text
937
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-44370/tokenizer.json filter=lfs diff=lfs merge=lfs -text
938
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-53244/tokenizer.json filter=lfs diff=lfs merge=lfs -text
939
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-13311/tokenizer.json filter=lfs diff=lfs merge=lfs -text
940
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-35496/tokenizer.json filter=lfs diff=lfs merge=lfs -text
941
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-79868/tokenizer.json filter=lfs diff=lfs merge=lfs -text
942
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-79866/tokenizer.json filter=lfs diff=lfs merge=lfs -text
943
+ sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-4437/tokenizer.json filter=lfs diff=lfs merge=lfs -text
944
+ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-11641/tokenizer.json filter=lfs diff=lfs merge=lfs -text
945
+ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-16630/tokenizer.json filter=lfs diff=lfs merge=lfs -text
946
+ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-1663/tokenizer.json filter=lfs diff=lfs merge=lfs -text
947
+ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-14967/tokenizer.json filter=lfs diff=lfs merge=lfs -text
948
+ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-8315/tokenizer.json filter=lfs diff=lfs merge=lfs -text
949
+ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-3326/tokenizer.json filter=lfs diff=lfs merge=lfs -text
950
+ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-19956/tokenizer.json filter=lfs diff=lfs merge=lfs -text
951
+ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-4989/tokenizer.json filter=lfs diff=lfs merge=lfs -text
952
+ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-23282/tokenizer.json filter=lfs diff=lfs merge=lfs -text
953
+ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-21619/tokenizer.json filter=lfs diff=lfs merge=lfs -text
grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011354/checkpoint-11200/global_step11200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d42ff5888e4976e5ddbbf573dc87c3c7b636b6453fd7183a72bf9d693e8b4a7
3
+ size 33580713114
grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f146dc48491e1d4e1735edabd20c057f5964ca7be6de6ab586a0324856e964df
3
+ size 33580713114
grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ca0e2fbbb3446fcd75a44b8a50c7b432f0426712f79a675bafba5eae5ec19f3
3
+ size 33580713114
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_003349/runs/May16_00-33-53_gcn152.local.snellius.surf.nl/events.out.tfevents.1747348453.gcn152.local.snellius.surf.nl.1752330.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae2a7eed72cce0c9c3ec653d85ff813a68277331ac9c7793576df999d4a016f9
3
+ size 7049
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc8e095bc6441f95e6e8e29cf6b66eba7d88d2cfa7ccafdb22f3ee09a2c44d21
3
+ size 11046672
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/global_step11900/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a03480640ed5ac664b89dd8bba61ff21ad82ace3158d8c800678e19f0670df22
3
+ size 22025200
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/global_step11900/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b60c4cb704b5701c80a22443d48fd695672555422ddba574e1eaba8dc94de710
3
+ size 321070
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79b3ba706a3c67682432b88064a5705fc6d1d4f249d720213a1403096aa2aeac
3
+ size 14768
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbb714ea7623877789f2e62f6d68e51e0e5c7ab0a7bc37d3189492ff784f3bb0
3
+ size 1064
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28d66de4fbd4e2f6e5a8eaae446968f1aa8ae0e6b0182620dd4c4af3ca34eaa2
3
+ size 11046672
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/global_step12600/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d92a8b33c5c2010da3593d76f682ba76f22448553a292437bbe948eada39927f
3
+ size 22025200
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/global_step12600/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:518b2cd16d6969e57d8b8402f0cf731a6d26a9aa3bed3a2a73ae8cffaf1d6582
3
+ size 321070
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1f9c3210fe4d3362c8db4461673a1d3bfce46d45a7350d2a73774ef53042702
3
+ size 14768
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5fd0f9b1cccf58217568759d259cdb618ff306f938fcab6b52cddb5f66111f3
3
+ size 1064
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569
3
+ size 7928
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:818cfaa1140b229a7404535be9b4ec1219b9ca9cc367407e2dad5d2dcbad1e12
3
+ size 11046672
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/global_step1400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b20fefca488a0c1ae1a820d2a631b7dcbd0f328e15da0827de2b97952b92648
3
+ size 22025200
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/global_step1400/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:673e16af27dd5a252e1ffa5954a7a34785a920ec1daa381e607041627a5ea3fb
3
+ size 321070
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2de562643ee968768bbaf486808a517d5c348aa2b2447b6bbadf0b2b01a2926
3
+ size 14768
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b271d283c76a220dc934ebcce83f89e813dd71201468502f3b652928e3dc3d36
3
+ size 1064
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569
3
+ size 7928
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2a8407a816b4f30cfa691696cd99aa310ac1ba8ab8953085fe6fe3382422fdf
3
+ size 11046672
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/global_step2100/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e432a870536041629a10faf9497af470027e75ad9c6895c38792bb0571ca28e
3
+ size 22025200
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/global_step2100/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a696cd3bf8e494110f2a1d4f57ccbbaf65fcae5f496e0180eeae0d3ed5e2a109
3
+ size 321070
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d74a4515646c8b0e5f9559bda6f8c3d2bed7194867308f6c23545fd9737be3bc
3
+ size 14768
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfb8972d97ba2ca80d4b89051bd72d12b4d6ea66122128610c3e3402f4dbc586
3
+ size 1064
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569
3
+ size 7928
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5616a261c608996aeca1c1cb05424d5a3049d85450b7a49566e99d14498cf7a
3
+ size 11046672
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/global_step2800/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be0cf02a71cc86afe583ae95bf06a80e7d20c43a456ad00ebbb309dead472687
3
+ size 22025200
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/global_step2800/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfbeb165b793dddc5a57a77511696beea836dc3fe4788466d686f4e1abe71030
3
+ size 321070
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af9a12b65ac8bda2f72aaf1ae8a3f7bd2d168a097e720d219838f6c1d4672930
3
+ size 14768
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b29389e582918d7b983b339df8c92a179c0ba93fc0319ddd17523d6df418518
3
+ size 1064
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569
3
+ size 7928
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b2cda54b44fc92007452897572ce51445b8f2f41a56a167b11ad5fe6b5422c2
3
+ size 11046672
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/global_step3500/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7843e040e6f509ce25881a99cc3cedb5d56b976cc7f7ca03df8cabc10d92141f
3
+ size 22025200
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/global_step3500/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:015cf4f601e258849a012f2b1e8a1fb8d942eeab7c860686796297d18987cb7f
3
+ size 321070
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f305f51c847d422a924b60c23a8b9cb9f6682e4d580f73b1bd0c06c4420f0c44
3
+ size 14768
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc35fdf33cc8349082c268dcdc4e6f9c9dc49ec32293bbfa7e76eea7ee934590
3
+ size 1064
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569
3
+ size 7928
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d2bfbfffadfdadb1d107966c1240d7b768a8d0349aff66788416cd2105bfba0
3
+ size 11046672
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/global_step4200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9d7d3e291f29f47375513c6d4217960c98a208778db0b9729060d4bcfa9ef96
3
+ size 22025200
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/global_step4200/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:892e119f92a4a3fb9f807125dbb00c8015ed848d75bc306b413be07f6cbd3d56
3
+ size 321070
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9391a908c471412ac3012ce12913d6d975202aa87d2d9dfe8aeec9d1fcdb661f
3
+ size 14768