Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +64 -0
- grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011354/checkpoint-11200/global_step11200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_003349/runs/May16_00-33-53_gcn152.local.snellius.surf.nl/events.out.tfevents.1747348453.gcn152.local.snellius.surf.nl.1752330.0 +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/adapter_model.safetensors +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/global_step11900/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/global_step11900/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/rng_state_0.pth +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/scheduler.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/tokenizer.json +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/adapter_model.safetensors +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/global_step12600/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/global_step12600/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/rng_state_0.pth +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/scheduler.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/tokenizer.json +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/training_args.bin +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/adapter_model.safetensors +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/global_step1400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/global_step1400/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/rng_state_0.pth +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/scheduler.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/tokenizer.json +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/training_args.bin +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/adapter_model.safetensors +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/global_step2100/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/global_step2100/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/rng_state_0.pth +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/scheduler.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/tokenizer.json +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/training_args.bin +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/adapter_model.safetensors +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/global_step2800/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/global_step2800/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/rng_state_0.pth +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/scheduler.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/tokenizer.json +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/training_args.bin +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/adapter_model.safetensors +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/global_step3500/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/global_step3500/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/rng_state_0.pth +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/scheduler.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/tokenizer.json +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/training_args.bin +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/adapter_model.safetensors +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/global_step4200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/global_step4200/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/rng_state_0.pth +3 -0
.gitattributes
CHANGED
|
@@ -887,3 +887,67 @@ sft/20250429_133317_sftqwenomni-fullsimple-loraopt-1e-8bs-0.0002/checkpoint-7497
|
|
| 887 |
sft/20250429_133317_sftqwenomni-fullsimple-loraopt-1e-8bs-0.0002/checkpoint-109056/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 888 |
sft/20250429_133317_sftqwenomni-fullsimple-loraopt-1e-8bs-0.0002/checkpoint-47712/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 889 |
sft/20250504_131507_sftqwenomni-semantic-loraopt-1e-4bs-0.0002/checkpoint-3327/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 887 |
sft/20250429_133317_sftqwenomni-fullsimple-loraopt-1e-8bs-0.0002/checkpoint-109056/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 888 |
sft/20250429_133317_sftqwenomni-fullsimple-loraopt-1e-8bs-0.0002/checkpoint-47712/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 889 |
sft/20250504_131507_sftqwenomni-semantic-loraopt-1e-4bs-0.0002/checkpoint-3327/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 890 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 891 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-9800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 892 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 893 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 894 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 895 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-7700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 896 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-9100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 897 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 898 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 899 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4900/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 900 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 901 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 902 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-5600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 903 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-6300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 904 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-8400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 905 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-7000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 906 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-3500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 907 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 908 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-2800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 909 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-7700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 910 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-4200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 911 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-4900/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 912 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-1400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 913 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-2100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 914 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-5600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 915 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_014243/checkpoint-6300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 916 |
+
sft/20250503_210304_sftqwenomni-semantic-noneopt-1e-4bs-0.0002/checkpoint-3327/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 917 |
+
sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-49816/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 918 |
+
sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-43589/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 919 |
+
sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-31135/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 920 |
+
sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-37362/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 921 |
+
sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-6227/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 922 |
+
sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-18681/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 923 |
+
sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-12454/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 924 |
+
sft/20250502_131506_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 925 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-26622/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 926 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-57681/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 927 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-31059/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 928 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-70992/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 929 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-48807/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 930 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-75429/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 931 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-22185/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 932 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-39933/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 933 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-8874/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 934 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-17748/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 935 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-66555/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 936 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-62118/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 937 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-44370/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 938 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-53244/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 939 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-13311/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 940 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-35496/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 941 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-79868/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 942 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-79866/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 943 |
+
sft/20250411_032518_sfttraining_qwen2.5_semantic_mc_qa-loraopt-3e-8bs-0.0002/checkpoint-4437/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 944 |
+
sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-11641/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 945 |
+
sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-16630/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 946 |
+
sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-1663/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 947 |
+
sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-14967/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 948 |
+
sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-8315/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 949 |
+
sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-3326/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 950 |
+
sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-19956/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 951 |
+
sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-4989/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 952 |
+
sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-23282/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 953 |
+
sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-21619/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011354/checkpoint-11200/global_step11200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d42ff5888e4976e5ddbbf573dc87c3c7b636b6453fd7183a72bf9d693e8b4a7
|
| 3 |
+
size 33580713114
|
grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f146dc48491e1d4e1735edabd20c057f5964ca7be6de6ab586a0324856e964df
|
| 3 |
+
size 33580713114
|
grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ca0e2fbbb3446fcd75a44b8a50c7b432f0426712f79a675bafba5eae5ec19f3
|
| 3 |
+
size 33580713114
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_003349/runs/May16_00-33-53_gcn152.local.snellius.surf.nl/events.out.tfevents.1747348453.gcn152.local.snellius.surf.nl.1752330.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae2a7eed72cce0c9c3ec653d85ff813a68277331ac9c7793576df999d4a016f9
|
| 3 |
+
size 7049
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bc8e095bc6441f95e6e8e29cf6b66eba7d88d2cfa7ccafdb22f3ee09a2c44d21
|
| 3 |
+
size 11046672
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/global_step11900/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a03480640ed5ac664b89dd8bba61ff21ad82ace3158d8c800678e19f0670df22
|
| 3 |
+
size 22025200
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/global_step11900/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b60c4cb704b5701c80a22443d48fd695672555422ddba574e1eaba8dc94de710
|
| 3 |
+
size 321070
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79b3ba706a3c67682432b88064a5705fc6d1d4f249d720213a1403096aa2aeac
|
| 3 |
+
size 14768
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fbb714ea7623877789f2e62f6d68e51e0e5c7ab0a7bc37d3189492ff784f3bb0
|
| 3 |
+
size 1064
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11900/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28d66de4fbd4e2f6e5a8eaae446968f1aa8ae0e6b0182620dd4c4af3ca34eaa2
|
| 3 |
+
size 11046672
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/global_step12600/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d92a8b33c5c2010da3593d76f682ba76f22448553a292437bbe948eada39927f
|
| 3 |
+
size 22025200
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/global_step12600/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:518b2cd16d6969e57d8b8402f0cf731a6d26a9aa3bed3a2a73ae8cffaf1d6582
|
| 3 |
+
size 321070
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1f9c3210fe4d3362c8db4461673a1d3bfce46d45a7350d2a73774ef53042702
|
| 3 |
+
size 14768
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b5fd0f9b1cccf58217568759d259cdb618ff306f938fcab6b52cddb5f66111f3
|
| 3 |
+
size 1064
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-12600/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569
|
| 3 |
+
size 7928
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:818cfaa1140b229a7404535be9b4ec1219b9ca9cc367407e2dad5d2dcbad1e12
|
| 3 |
+
size 11046672
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/global_step1400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b20fefca488a0c1ae1a820d2a631b7dcbd0f328e15da0827de2b97952b92648
|
| 3 |
+
size 22025200
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/global_step1400/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:673e16af27dd5a252e1ffa5954a7a34785a920ec1daa381e607041627a5ea3fb
|
| 3 |
+
size 321070
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d2de562643ee968768bbaf486808a517d5c348aa2b2447b6bbadf0b2b01a2926
|
| 3 |
+
size 14768
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b271d283c76a220dc934ebcce83f89e813dd71201468502f3b652928e3dc3d36
|
| 3 |
+
size 1064
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-1400/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569
|
| 3 |
+
size 7928
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2a8407a816b4f30cfa691696cd99aa310ac1ba8ab8953085fe6fe3382422fdf
|
| 3 |
+
size 11046672
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/global_step2100/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e432a870536041629a10faf9497af470027e75ad9c6895c38792bb0571ca28e
|
| 3 |
+
size 22025200
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/global_step2100/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a696cd3bf8e494110f2a1d4f57ccbbaf65fcae5f496e0180eeae0d3ed5e2a109
|
| 3 |
+
size 321070
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d74a4515646c8b0e5f9559bda6f8c3d2bed7194867308f6c23545fd9737be3bc
|
| 3 |
+
size 14768
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dfb8972d97ba2ca80d4b89051bd72d12b4d6ea66122128610c3e3402f4dbc586
|
| 3 |
+
size 1064
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2100/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569
|
| 3 |
+
size 7928
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5616a261c608996aeca1c1cb05424d5a3049d85450b7a49566e99d14498cf7a
|
| 3 |
+
size 11046672
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/global_step2800/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be0cf02a71cc86afe583ae95bf06a80e7d20c43a456ad00ebbb309dead472687
|
| 3 |
+
size 22025200
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/global_step2800/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dfbeb165b793dddc5a57a77511696beea836dc3fe4788466d686f4e1abe71030
|
| 3 |
+
size 321070
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af9a12b65ac8bda2f72aaf1ae8a3f7bd2d168a097e720d219838f6c1d4672930
|
| 3 |
+
size 14768
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b29389e582918d7b983b339df8c92a179c0ba93fc0319ddd17523d6df418518
|
| 3 |
+
size 1064
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-2800/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569
|
| 3 |
+
size 7928
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b2cda54b44fc92007452897572ce51445b8f2f41a56a167b11ad5fe6b5422c2
|
| 3 |
+
size 11046672
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/global_step3500/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7843e040e6f509ce25881a99cc3cedb5d56b976cc7f7ca03df8cabc10d92141f
|
| 3 |
+
size 22025200
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/global_step3500/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:015cf4f601e258849a012f2b1e8a1fb8d942eeab7c860686796297d18987cb7f
|
| 3 |
+
size 321070
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f305f51c847d422a924b60c23a8b9cb9f6682e4d580f73b1bd0c06c4420f0c44
|
| 3 |
+
size 14768
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc35fdf33cc8349082c268dcdc4e6f9c9dc49ec32293bbfa7e76eea7ee934590
|
| 3 |
+
size 1064
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-3500/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569
|
| 3 |
+
size 7928
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d2bfbfffadfdadb1d107966c1240d7b768a8d0349aff66788416cd2105bfba0
|
| 3 |
+
size 11046672
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/global_step4200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e9d7d3e291f29f47375513c6d4217960c98a208778db0b9729060d4bcfa9ef96
|
| 3 |
+
size 22025200
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/global_step4200/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:892e119f92a4a3fb9f807125dbb00c8015ed848d75bc306b413be07f6cbd3d56
|
| 3 |
+
size 321070
|
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-4200/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9391a908c471412ac3012ce12913d6d975202aa87d2d9dfe8aeec9d1fcdb661f
|
| 3 |
+
size 14768
|