diff --git a/.gitattributes b/.gitattributes index 81b7cf71a657747be890728bb3c9d98095173e1c..d1d3d6442e6d207bf8f7714d703ea1ca752a15d2 100644 --- a/.gitattributes +++ b/.gitattributes @@ -49,3 +49,11 @@ saves-sft-1016-2/saves-sft-1016-2/Qwen/Qwen3-4B/lora/sft/checkpoint-56/tokenizer saves-sft-1016-2/saves-sft-1016-2/Qwen/Qwen3-4B/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text saves-sft-1016-2/saves-sft-1016-2/Qwen/Qwen3-8B/lora/sft/checkpoint-56/tokenizer.json filter=lfs diff=lfs merge=lfs -text saves-sft-1016-2/saves-sft-1016-2/Qwen/Qwen3-8B/lora/sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text +GRPO/Qwen2.5-1.5B-Instruct/tokenizer.json filter=lfs diff=lfs merge=lfs -text +GRPO/Qwen2.5-7B-Instruct/tokenizer.json filter=lfs diff=lfs merge=lfs -text +GRPO/Qwen3-4B/tokenizer.json filter=lfs diff=lfs merge=lfs -text +GRPO/Qwen3-8B/tokenizer.json filter=lfs diff=lfs merge=lfs -text +SFT/Qwen2.5-1.5B-Instruct/tokenizer.json filter=lfs diff=lfs merge=lfs -text +SFT/Qwen2.5-7B-Instruct/tokenizer.json filter=lfs diff=lfs merge=lfs -text +SFT/Qwen3-4B/tokenizer.json filter=lfs diff=lfs merge=lfs -text +SFT/Qwen3-8B/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/Qwen-grpo/Qwen2.5-1.5B-Instruct/added_tokens.json b/GRPO/Qwen2.5-1.5B-Instruct/added_tokens.json similarity index 100% rename from Qwen-grpo/Qwen2.5-1.5B-Instruct/added_tokens.json rename to GRPO/Qwen2.5-1.5B-Instruct/added_tokens.json diff --git a/Qwen-grpo/Qwen2.5-1.5B-Instruct/chat_template.jinja b/GRPO/Qwen2.5-1.5B-Instruct/chat_template.jinja similarity index 100% rename from Qwen-grpo/Qwen2.5-1.5B-Instruct/chat_template.jinja rename to GRPO/Qwen2.5-1.5B-Instruct/chat_template.jinja diff --git a/Qwen-grpo/Qwen2.5-1.5B-Instruct/config.json b/GRPO/Qwen2.5-1.5B-Instruct/config.json similarity index 100% rename from Qwen-grpo/Qwen2.5-1.5B-Instruct/config.json rename to GRPO/Qwen2.5-1.5B-Instruct/config.json diff --git a/Qwen-grpo/Qwen2.5-1.5B-Instruct/generation_config.json b/GRPO/Qwen2.5-1.5B-Instruct/generation_config.json similarity index 100% rename from Qwen-grpo/Qwen2.5-1.5B-Instruct/generation_config.json rename to GRPO/Qwen2.5-1.5B-Instruct/generation_config.json diff --git a/Qwen-grpo/Qwen2.5-1.5B-Instruct/merges.txt b/GRPO/Qwen2.5-1.5B-Instruct/merges.txt similarity index 100% rename from Qwen-grpo/Qwen2.5-1.5B-Instruct/merges.txt rename to GRPO/Qwen2.5-1.5B-Instruct/merges.txt diff --git a/Qwen-grpo/Qwen2.5-1.5B-Instruct/model.safetensors b/GRPO/Qwen2.5-1.5B-Instruct/model.safetensors similarity index 100% rename from Qwen-grpo/Qwen2.5-1.5B-Instruct/model.safetensors rename to GRPO/Qwen2.5-1.5B-Instruct/model.safetensors diff --git a/Qwen-grpo/Qwen2.5-1.5B-Instruct/special_tokens_map.json b/GRPO/Qwen2.5-1.5B-Instruct/special_tokens_map.json similarity index 100% rename from Qwen-grpo/Qwen2.5-1.5B-Instruct/special_tokens_map.json rename to GRPO/Qwen2.5-1.5B-Instruct/special_tokens_map.json diff --git a/Qwen-grpo/Qwen2.5-1.5B-Instruct/tokenizer.json b/GRPO/Qwen2.5-1.5B-Instruct/tokenizer.json similarity index 100% rename from Qwen-grpo/Qwen2.5-1.5B-Instruct/tokenizer.json rename to GRPO/Qwen2.5-1.5B-Instruct/tokenizer.json diff --git a/Qwen-grpo/Qwen2.5-1.5B-Instruct/tokenizer_config.json b/GRPO/Qwen2.5-1.5B-Instruct/tokenizer_config.json similarity index 100% rename from Qwen-grpo/Qwen2.5-1.5B-Instruct/tokenizer_config.json rename to GRPO/Qwen2.5-1.5B-Instruct/tokenizer_config.json diff --git a/Qwen-grpo/Qwen2.5-1.5B-Instruct/vocab.json b/GRPO/Qwen2.5-1.5B-Instruct/vocab.json similarity index 100% rename from Qwen-grpo/Qwen2.5-1.5B-Instruct/vocab.json rename to GRPO/Qwen2.5-1.5B-Instruct/vocab.json diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/added_tokens.json b/GRPO/Qwen2.5-7B-Instruct/added_tokens.json similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/added_tokens.json rename to GRPO/Qwen2.5-7B-Instruct/added_tokens.json diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/chat_template.jinja b/GRPO/Qwen2.5-7B-Instruct/chat_template.jinja similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/chat_template.jinja rename to GRPO/Qwen2.5-7B-Instruct/chat_template.jinja diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/config.json b/GRPO/Qwen2.5-7B-Instruct/config.json similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/config.json rename to GRPO/Qwen2.5-7B-Instruct/config.json diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/generation_config.json b/GRPO/Qwen2.5-7B-Instruct/generation_config.json similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/generation_config.json rename to GRPO/Qwen2.5-7B-Instruct/generation_config.json diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/merges.txt b/GRPO/Qwen2.5-7B-Instruct/merges.txt similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/merges.txt rename to GRPO/Qwen2.5-7B-Instruct/merges.txt diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/model-00001-of-00004.safetensors b/GRPO/Qwen2.5-7B-Instruct/model-00001-of-00004.safetensors similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/model-00001-of-00004.safetensors rename to GRPO/Qwen2.5-7B-Instruct/model-00001-of-00004.safetensors diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/model-00002-of-00004.safetensors b/GRPO/Qwen2.5-7B-Instruct/model-00002-of-00004.safetensors similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/model-00002-of-00004.safetensors rename to GRPO/Qwen2.5-7B-Instruct/model-00002-of-00004.safetensors diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/model-00003-of-00004.safetensors b/GRPO/Qwen2.5-7B-Instruct/model-00003-of-00004.safetensors similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/model-00003-of-00004.safetensors rename to GRPO/Qwen2.5-7B-Instruct/model-00003-of-00004.safetensors diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/model-00004-of-00004.safetensors b/GRPO/Qwen2.5-7B-Instruct/model-00004-of-00004.safetensors similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/model-00004-of-00004.safetensors rename to GRPO/Qwen2.5-7B-Instruct/model-00004-of-00004.safetensors diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/model.safetensors.index.json b/GRPO/Qwen2.5-7B-Instruct/model.safetensors.index.json similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/model.safetensors.index.json rename to GRPO/Qwen2.5-7B-Instruct/model.safetensors.index.json diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/special_tokens_map.json b/GRPO/Qwen2.5-7B-Instruct/special_tokens_map.json similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/special_tokens_map.json rename to GRPO/Qwen2.5-7B-Instruct/special_tokens_map.json diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/tokenizer.json b/GRPO/Qwen2.5-7B-Instruct/tokenizer.json similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/tokenizer.json rename to GRPO/Qwen2.5-7B-Instruct/tokenizer.json diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/tokenizer_config.json b/GRPO/Qwen2.5-7B-Instruct/tokenizer_config.json similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/tokenizer_config.json rename to GRPO/Qwen2.5-7B-Instruct/tokenizer_config.json diff --git a/Qwen-grpo/Qwen2.5-7B-Instruct/vocab.json b/GRPO/Qwen2.5-7B-Instruct/vocab.json similarity index 100% rename from Qwen-grpo/Qwen2.5-7B-Instruct/vocab.json rename to GRPO/Qwen2.5-7B-Instruct/vocab.json diff --git a/Qwen-grpo/Qwen3-4B/added_tokens.json b/GRPO/Qwen3-4B/added_tokens.json similarity index 100% rename from Qwen-grpo/Qwen3-4B/added_tokens.json rename to GRPO/Qwen3-4B/added_tokens.json diff --git a/Qwen-grpo/Qwen3-4B/chat_template.jinja b/GRPO/Qwen3-4B/chat_template.jinja similarity index 100% rename from Qwen-grpo/Qwen3-4B/chat_template.jinja rename to GRPO/Qwen3-4B/chat_template.jinja diff --git a/Qwen-grpo/Qwen3-4B/config.json b/GRPO/Qwen3-4B/config.json similarity index 100% rename from Qwen-grpo/Qwen3-4B/config.json rename to GRPO/Qwen3-4B/config.json diff --git a/Qwen-grpo/Qwen3-4B/generation_config.json b/GRPO/Qwen3-4B/generation_config.json similarity index 100% rename from Qwen-grpo/Qwen3-4B/generation_config.json rename to GRPO/Qwen3-4B/generation_config.json diff --git a/Qwen-grpo/Qwen3-4B/merges.txt b/GRPO/Qwen3-4B/merges.txt similarity index 100% rename from Qwen-grpo/Qwen3-4B/merges.txt rename to GRPO/Qwen3-4B/merges.txt diff --git a/Qwen-grpo/Qwen3-4B/model-00001-of-00002.safetensors b/GRPO/Qwen3-4B/model-00001-of-00002.safetensors similarity index 100% rename from Qwen-grpo/Qwen3-4B/model-00001-of-00002.safetensors rename to GRPO/Qwen3-4B/model-00001-of-00002.safetensors diff --git a/Qwen-grpo/Qwen3-4B/model-00002-of-00002.safetensors b/GRPO/Qwen3-4B/model-00002-of-00002.safetensors similarity index 100% rename from Qwen-grpo/Qwen3-4B/model-00002-of-00002.safetensors rename to GRPO/Qwen3-4B/model-00002-of-00002.safetensors diff --git a/Qwen-grpo/Qwen3-4B/model.safetensors.index.json b/GRPO/Qwen3-4B/model.safetensors.index.json similarity index 100% rename from Qwen-grpo/Qwen3-4B/model.safetensors.index.json rename to GRPO/Qwen3-4B/model.safetensors.index.json diff --git a/Qwen-grpo/Qwen3-4B/special_tokens_map.json b/GRPO/Qwen3-4B/special_tokens_map.json similarity index 100% rename from Qwen-grpo/Qwen3-4B/special_tokens_map.json rename to GRPO/Qwen3-4B/special_tokens_map.json diff --git a/Qwen-grpo/Qwen3-4B/tokenizer.json b/GRPO/Qwen3-4B/tokenizer.json similarity index 100% rename from Qwen-grpo/Qwen3-4B/tokenizer.json rename to GRPO/Qwen3-4B/tokenizer.json diff --git a/Qwen-grpo/Qwen3-4B/tokenizer_config.json b/GRPO/Qwen3-4B/tokenizer_config.json similarity index 100% rename from Qwen-grpo/Qwen3-4B/tokenizer_config.json rename to GRPO/Qwen3-4B/tokenizer_config.json diff --git a/Qwen-grpo/Qwen3-4B/vocab.json b/GRPO/Qwen3-4B/vocab.json similarity index 100% rename from Qwen-grpo/Qwen3-4B/vocab.json rename to GRPO/Qwen3-4B/vocab.json diff --git a/Qwen-grpo/Qwen3-8B/added_tokens.json b/GRPO/Qwen3-8B/added_tokens.json similarity index 100% rename from Qwen-grpo/Qwen3-8B/added_tokens.json rename to GRPO/Qwen3-8B/added_tokens.json diff --git a/Qwen-grpo/Qwen3-8B/chat_template.jinja b/GRPO/Qwen3-8B/chat_template.jinja similarity index 100% rename from Qwen-grpo/Qwen3-8B/chat_template.jinja rename to GRPO/Qwen3-8B/chat_template.jinja diff --git a/Qwen-grpo/Qwen3-8B/config.json b/GRPO/Qwen3-8B/config.json similarity index 100% rename from Qwen-grpo/Qwen3-8B/config.json rename to GRPO/Qwen3-8B/config.json diff --git a/Qwen-grpo/Qwen3-8B/generation_config.json b/GRPO/Qwen3-8B/generation_config.json similarity index 100% rename from Qwen-grpo/Qwen3-8B/generation_config.json rename to GRPO/Qwen3-8B/generation_config.json diff --git a/Qwen-grpo/Qwen3-8B/merges.txt b/GRPO/Qwen3-8B/merges.txt similarity index 100% rename from Qwen-grpo/Qwen3-8B/merges.txt rename to GRPO/Qwen3-8B/merges.txt diff --git a/Qwen-grpo/Qwen3-8B/model-00001-of-00004.safetensors b/GRPO/Qwen3-8B/model-00001-of-00004.safetensors similarity index 100% rename from Qwen-grpo/Qwen3-8B/model-00001-of-00004.safetensors rename to GRPO/Qwen3-8B/model-00001-of-00004.safetensors diff --git a/Qwen-grpo/Qwen3-8B/model-00002-of-00004.safetensors b/GRPO/Qwen3-8B/model-00002-of-00004.safetensors similarity index 100% rename from Qwen-grpo/Qwen3-8B/model-00002-of-00004.safetensors rename to GRPO/Qwen3-8B/model-00002-of-00004.safetensors diff --git a/Qwen-grpo/Qwen3-8B/model-00003-of-00004.safetensors b/GRPO/Qwen3-8B/model-00003-of-00004.safetensors similarity index 100% rename from Qwen-grpo/Qwen3-8B/model-00003-of-00004.safetensors rename to GRPO/Qwen3-8B/model-00003-of-00004.safetensors diff --git a/Qwen-grpo/Qwen3-8B/model-00004-of-00004.safetensors b/GRPO/Qwen3-8B/model-00004-of-00004.safetensors similarity index 100% rename from Qwen-grpo/Qwen3-8B/model-00004-of-00004.safetensors rename to GRPO/Qwen3-8B/model-00004-of-00004.safetensors diff --git a/Qwen-grpo/Qwen3-8B/model.safetensors.index.json b/GRPO/Qwen3-8B/model.safetensors.index.json similarity index 100% rename from Qwen-grpo/Qwen3-8B/model.safetensors.index.json rename to GRPO/Qwen3-8B/model.safetensors.index.json diff --git a/Qwen-grpo/Qwen3-8B/special_tokens_map.json b/GRPO/Qwen3-8B/special_tokens_map.json similarity index 100% rename from Qwen-grpo/Qwen3-8B/special_tokens_map.json rename to GRPO/Qwen3-8B/special_tokens_map.json diff --git a/Qwen-grpo/Qwen3-8B/tokenizer.json b/GRPO/Qwen3-8B/tokenizer.json similarity index 100% rename from Qwen-grpo/Qwen3-8B/tokenizer.json rename to GRPO/Qwen3-8B/tokenizer.json diff --git a/Qwen-grpo/Qwen3-8B/tokenizer_config.json b/GRPO/Qwen3-8B/tokenizer_config.json similarity index 100% rename from Qwen-grpo/Qwen3-8B/tokenizer_config.json rename to GRPO/Qwen3-8B/tokenizer_config.json diff --git a/Qwen-grpo/Qwen3-8B/vocab.json b/GRPO/Qwen3-8B/vocab.json similarity index 100% rename from Qwen-grpo/Qwen3-8B/vocab.json rename to GRPO/Qwen3-8B/vocab.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/Modelfile b/SFT/Qwen2.5-1.5B-Instruct/Modelfile similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/Modelfile rename to SFT/Qwen2.5-1.5B-Instruct/Modelfile diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/added_tokens.json b/SFT/Qwen2.5-1.5B-Instruct/added_tokens.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/added_tokens.json rename to SFT/Qwen2.5-1.5B-Instruct/added_tokens.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/chat_template.jinja b/SFT/Qwen2.5-1.5B-Instruct/chat_template.jinja similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/chat_template.jinja rename to SFT/Qwen2.5-1.5B-Instruct/chat_template.jinja diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/config.json b/SFT/Qwen2.5-1.5B-Instruct/config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/config.json rename to SFT/Qwen2.5-1.5B-Instruct/config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/generation_config.json b/SFT/Qwen2.5-1.5B-Instruct/generation_config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/generation_config.json rename to SFT/Qwen2.5-1.5B-Instruct/generation_config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/merges.txt b/SFT/Qwen2.5-1.5B-Instruct/merges.txt similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/merges.txt rename to SFT/Qwen2.5-1.5B-Instruct/merges.txt diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/model.safetensors b/SFT/Qwen2.5-1.5B-Instruct/model.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/model.safetensors rename to SFT/Qwen2.5-1.5B-Instruct/model.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/special_tokens_map.json b/SFT/Qwen2.5-1.5B-Instruct/special_tokens_map.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/special_tokens_map.json rename to SFT/Qwen2.5-1.5B-Instruct/special_tokens_map.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/tokenizer.json b/SFT/Qwen2.5-1.5B-Instruct/tokenizer.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/tokenizer.json rename to SFT/Qwen2.5-1.5B-Instruct/tokenizer.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/tokenizer_config.json b/SFT/Qwen2.5-1.5B-Instruct/tokenizer_config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/tokenizer_config.json rename to SFT/Qwen2.5-1.5B-Instruct/tokenizer_config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/vocab.json b/SFT/Qwen2.5-1.5B-Instruct/vocab.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-1.5B-Instruct/vocab.json rename to SFT/Qwen2.5-1.5B-Instruct/vocab.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/Modelfile b/SFT/Qwen2.5-7B-Instruct/Modelfile similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/Modelfile rename to SFT/Qwen2.5-7B-Instruct/Modelfile diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/added_tokens.json b/SFT/Qwen2.5-7B-Instruct/added_tokens.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/added_tokens.json rename to SFT/Qwen2.5-7B-Instruct/added_tokens.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/chat_template.jinja b/SFT/Qwen2.5-7B-Instruct/chat_template.jinja similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/chat_template.jinja rename to SFT/Qwen2.5-7B-Instruct/chat_template.jinja diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/config.json b/SFT/Qwen2.5-7B-Instruct/config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/config.json rename to SFT/Qwen2.5-7B-Instruct/config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/generation_config.json b/SFT/Qwen2.5-7B-Instruct/generation_config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/generation_config.json rename to SFT/Qwen2.5-7B-Instruct/generation_config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/merges.txt b/SFT/Qwen2.5-7B-Instruct/merges.txt similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/merges.txt rename to SFT/Qwen2.5-7B-Instruct/merges.txt diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/model-00001-of-00004.safetensors b/SFT/Qwen2.5-7B-Instruct/model-00001-of-00004.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/model-00001-of-00004.safetensors rename to SFT/Qwen2.5-7B-Instruct/model-00001-of-00004.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/model-00002-of-00004.safetensors b/SFT/Qwen2.5-7B-Instruct/model-00002-of-00004.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/model-00002-of-00004.safetensors rename to SFT/Qwen2.5-7B-Instruct/model-00002-of-00004.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/model-00003-of-00004.safetensors b/SFT/Qwen2.5-7B-Instruct/model-00003-of-00004.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/model-00003-of-00004.safetensors rename to SFT/Qwen2.5-7B-Instruct/model-00003-of-00004.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/model-00004-of-00004.safetensors b/SFT/Qwen2.5-7B-Instruct/model-00004-of-00004.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/model-00004-of-00004.safetensors rename to SFT/Qwen2.5-7B-Instruct/model-00004-of-00004.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/model.safetensors.index.json b/SFT/Qwen2.5-7B-Instruct/model.safetensors.index.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/model.safetensors.index.json rename to SFT/Qwen2.5-7B-Instruct/model.safetensors.index.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/special_tokens_map.json b/SFT/Qwen2.5-7B-Instruct/special_tokens_map.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/special_tokens_map.json rename to SFT/Qwen2.5-7B-Instruct/special_tokens_map.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/tokenizer.json b/SFT/Qwen2.5-7B-Instruct/tokenizer.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/tokenizer.json rename to SFT/Qwen2.5-7B-Instruct/tokenizer.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/tokenizer_config.json b/SFT/Qwen2.5-7B-Instruct/tokenizer_config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/tokenizer_config.json rename to SFT/Qwen2.5-7B-Instruct/tokenizer_config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/vocab.json b/SFT/Qwen2.5-7B-Instruct/vocab.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen2.5-7B-Instruct/vocab.json rename to SFT/Qwen2.5-7B-Instruct/vocab.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/Modelfile b/SFT/Qwen3-4B/Modelfile similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/Modelfile rename to SFT/Qwen3-4B/Modelfile diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/added_tokens.json b/SFT/Qwen3-4B/added_tokens.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/added_tokens.json rename to SFT/Qwen3-4B/added_tokens.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/chat_template.jinja b/SFT/Qwen3-4B/chat_template.jinja similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/chat_template.jinja rename to SFT/Qwen3-4B/chat_template.jinja diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/config.json b/SFT/Qwen3-4B/config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/config.json rename to SFT/Qwen3-4B/config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/generation_config.json b/SFT/Qwen3-4B/generation_config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/generation_config.json rename to SFT/Qwen3-4B/generation_config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/merges.txt b/SFT/Qwen3-4B/merges.txt similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/merges.txt rename to SFT/Qwen3-4B/merges.txt diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/model-00001-of-00002.safetensors b/SFT/Qwen3-4B/model-00001-of-00002.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/model-00001-of-00002.safetensors rename to SFT/Qwen3-4B/model-00001-of-00002.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/model-00002-of-00002.safetensors b/SFT/Qwen3-4B/model-00002-of-00002.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/model-00002-of-00002.safetensors rename to SFT/Qwen3-4B/model-00002-of-00002.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/model.safetensors.index.json b/SFT/Qwen3-4B/model.safetensors.index.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/model.safetensors.index.json rename to SFT/Qwen3-4B/model.safetensors.index.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/special_tokens_map.json b/SFT/Qwen3-4B/special_tokens_map.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/special_tokens_map.json rename to SFT/Qwen3-4B/special_tokens_map.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/tokenizer.json b/SFT/Qwen3-4B/tokenizer.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/tokenizer.json rename to SFT/Qwen3-4B/tokenizer.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/tokenizer_config.json b/SFT/Qwen3-4B/tokenizer_config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/tokenizer_config.json rename to SFT/Qwen3-4B/tokenizer_config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/vocab.json b/SFT/Qwen3-4B/vocab.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-4B/vocab.json rename to SFT/Qwen3-4B/vocab.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/Modelfile b/SFT/Qwen3-8B/Modelfile similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/Modelfile rename to SFT/Qwen3-8B/Modelfile diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/added_tokens.json b/SFT/Qwen3-8B/added_tokens.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/added_tokens.json rename to SFT/Qwen3-8B/added_tokens.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/chat_template.jinja b/SFT/Qwen3-8B/chat_template.jinja similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/chat_template.jinja rename to SFT/Qwen3-8B/chat_template.jinja diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/config.json b/SFT/Qwen3-8B/config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/config.json rename to SFT/Qwen3-8B/config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/generation_config.json b/SFT/Qwen3-8B/generation_config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/generation_config.json rename to SFT/Qwen3-8B/generation_config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/merges.txt b/SFT/Qwen3-8B/merges.txt similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/merges.txt rename to SFT/Qwen3-8B/merges.txt diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/model-00001-of-00004.safetensors b/SFT/Qwen3-8B/model-00001-of-00004.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/model-00001-of-00004.safetensors rename to SFT/Qwen3-8B/model-00001-of-00004.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/model-00002-of-00004.safetensors b/SFT/Qwen3-8B/model-00002-of-00004.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/model-00002-of-00004.safetensors rename to SFT/Qwen3-8B/model-00002-of-00004.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/model-00003-of-00004.safetensors b/SFT/Qwen3-8B/model-00003-of-00004.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/model-00003-of-00004.safetensors rename to SFT/Qwen3-8B/model-00003-of-00004.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/model-00004-of-00004.safetensors b/SFT/Qwen3-8B/model-00004-of-00004.safetensors similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/model-00004-of-00004.safetensors rename to SFT/Qwen3-8B/model-00004-of-00004.safetensors diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/model.safetensors.index.json b/SFT/Qwen3-8B/model.safetensors.index.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/model.safetensors.index.json rename to SFT/Qwen3-8B/model.safetensors.index.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/special_tokens_map.json b/SFT/Qwen3-8B/special_tokens_map.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/special_tokens_map.json rename to SFT/Qwen3-8B/special_tokens_map.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/tokenizer.json b/SFT/Qwen3-8B/tokenizer.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/tokenizer.json rename to SFT/Qwen3-8B/tokenizer.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/tokenizer_config.json b/SFT/Qwen3-8B/tokenizer_config.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/tokenizer_config.json rename to SFT/Qwen3-8B/tokenizer_config.json diff --git a/output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/vocab.json b/SFT/Qwen3-8B/vocab.json similarity index 100% rename from output-sft-no-format-1016-2/output-sft-no-format-1016-2/Qwen3-8B/vocab.json rename to SFT/Qwen3-8B/vocab.json