diff --git a/.gitattributes b/.gitattributes index db648d43567b124bfd765d61e8151032353f9a89..3fc552b0f8901ca15a6aee1b079369ae0f89aecc 100644 --- a/.gitattributes +++ b/.gitattributes @@ -72,3 +72,6 @@ legacy/video_mllm_swift/s1_declip_siglip2_qwen3_1.7b/v0-20260314-141147/checkpoi legacy/video_mllm_swift/s1_siglip2_qwen3_1.7b/v11-20260314-090153/checkpoint-2000/tokenizer.json filter=lfs diff=lfs merge=lfs -text legacy/video_mllm_swift/s1_siglip2_qwen3_1.7b/v11-20260314-090153/checkpoint-2181/tokenizer.json filter=lfs diff=lfs merge=lfs -text legacy/video_mllm_swift/s2_declip_siglip2_qwen3_1.7b_10pct/checkpoint-1000/tokenizer.json filter=lfs diff=lfs merge=lfs -text +legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/tokenizer.json filter=lfs diff=lfs merge=lfs -text +legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/tokenizer.json filter=lfs diff=lfs merge=lfs -text +legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/mp_rank_00_model_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/mp_rank_00_model_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/mp_rank_00_model_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/global_step300/mp_rank_00_model_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/latest b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/latest similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/latest rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/latest diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/model.safetensors b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/model.safetensors similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/model.safetensors rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/model.safetensors diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/processor_config.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/processor_config.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/processor_config.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/processor_config.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_0.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_0.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_0.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_0.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_1.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_1.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_1.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_1.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_2.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_2.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_2.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_2.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_3.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_3.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_3.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_3.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_4.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_4.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_4.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_4.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_5.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_5.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_5.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_5.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_6.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_6.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_6.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_6.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_7.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_7.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_7.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/rng_state_7.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/scheduler.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/scheduler.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/scheduler.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/scheduler.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/tokenizer.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/tokenizer.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/tokenizer.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/tokenizer.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/tokenizer_config.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/tokenizer_config.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/tokenizer_config.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/tokenizer_config.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/trainer_state.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/trainer_state.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/trainer_state.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/trainer_state.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/training_args.bin b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/training_args.bin similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/training_args.bin rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/training_args.bin diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/zero_to_fp32.py b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/zero_to_fp32.py similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/zero_to_fp32.py rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-300/zero_to_fp32.py diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/args.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/args.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/args.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/args.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/chat_template.jinja b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/chat_template.jinja similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/chat_template.jinja rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/chat_template.jinja diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/config.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/config.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/config.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/config.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/generation_config.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/generation_config.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/generation_config.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/generation_config.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/mp_rank_00_model_states.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/mp_rank_00_model_states.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/mp_rank_00_model_states.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/global_step400/mp_rank_00_model_states.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/latest b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/latest similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/latest rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/latest diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/model.safetensors b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/model.safetensors similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/model.safetensors rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/model.safetensors diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/processor_config.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/processor_config.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/processor_config.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/processor_config.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_0.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_0.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_0.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_0.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_1.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_1.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_1.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_1.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_2.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_2.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_2.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_2.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_4.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_4.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_4.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_4.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_5.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_5.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_5.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_5.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_7.pth b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_7.pth similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_7.pth rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/rng_state_7.pth diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/scheduler.pt b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/scheduler.pt similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/scheduler.pt rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/scheduler.pt diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/tokenizer.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/tokenizer.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/tokenizer.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/tokenizer.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/tokenizer_config.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/tokenizer_config.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/tokenizer_config.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/tokenizer_config.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/trainer_state.json b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/trainer_state.json similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/trainer_state.json rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/trainer_state.json diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/training_args.bin b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/training_args.bin similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/training_args.bin rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/training_args.bin diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/zero_to_fp32.py b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/zero_to_fp32.py similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/zero_to_fp32.py rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/checkpoint-400/zero_to_fp32.py diff --git a/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/logging.jsonl b/legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/logging.jsonl similarity index 100% rename from video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/logging.jsonl rename to legacy/video_mllm_swift/s2_image_only_10pct/v1-20260316-135215/logging.jsonl diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/args.json b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/args.json similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/args.json rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/args.json diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/args.json b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/args.json similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/args.json rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/args.json diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/chat_template.jinja b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/chat_template.jinja similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/chat_template.jinja rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/chat_template.jinja diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/config.json b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/config.json similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/config.json rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/config.json diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/generation_config.json b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/generation_config.json similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/generation_config.json rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/generation_config.json diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/mp_rank_00_model_states.pt b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/mp_rank_00_model_states.pt similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/mp_rank_00_model_states.pt rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/global_step900/mp_rank_00_model_states.pt diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/latest b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/latest similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/latest rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/latest diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/model.safetensors b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/model.safetensors similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/model.safetensors rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/model.safetensors diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/processor_config.json b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/processor_config.json similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/processor_config.json rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/processor_config.json diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_0.pth b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_0.pth similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_0.pth rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_0.pth diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_1.pth b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_1.pth similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_1.pth rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_1.pth diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_2.pth b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_2.pth similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_2.pth rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_2.pth diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_3.pth b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_3.pth similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_3.pth rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_3.pth diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_4.pth b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_4.pth similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_4.pth rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_4.pth diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_5.pth b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_5.pth similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_5.pth rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_5.pth diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_6.pth b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_6.pth similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_6.pth rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_6.pth diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_7.pth b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_7.pth similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_7.pth rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/rng_state_7.pth diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/scheduler.pt b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/scheduler.pt similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/scheduler.pt rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/scheduler.pt diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/tokenizer.json b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/tokenizer.json similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/tokenizer.json rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/tokenizer.json diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/tokenizer_config.json b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/tokenizer_config.json similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/tokenizer_config.json rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/tokenizer_config.json diff --git a/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/trainer_state.json b/legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/trainer_state.json similarity index 100% rename from video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/trainer_state.json rename to legacy/video_mllm_swift/s2_siglip2_qwen3_1.7b_10pct/checkpoint-900/trainer_state.json