prune global_step_40 (keep only latest global_step_48) a5ce848 verified williamium committed 13 days ago
prune global_step_30 (keep only latest global_step_48) c73fbef verified williamium committed 13 days ago
prune global_step_20 (keep only latest global_step_48) 1811d60 verified williamium committed 13 days ago
prune global_step_10 (keep only latest global_step_48) 52b0b5d verified williamium committed 13 days ago
add sft_7b_gpt_llava_r8_2ep (sft_qwen2.5vl7b_gpt_llava_rephrase8_2ep) 35dbf3c verified williamium committed 17 days ago
add sft_7b_gpt_llava_mp_2ep (sft_qwen2.5vl7b_gpt_llava_multiprompt_2ep) 4b5fcc2 verified williamium committed 17 days ago
add sft_7b_gpt_mixfv_r8_2ep (sft_qwen2.5vl7b_gpt_mixfv_rephrase8_2ep) cae10bb verified williamium committed 17 days ago
add sft_3b_gpt_llava_r8_2ep (sft_qwen2.5vl3b_gpt_llava_rephrase8_2ep) a4e9b24 verified williamium committed 17 days ago
add sft_3b_gpt_mixfv_r8_2ep (sft_qwen2.5vl3b_gpt_mixfv_rephrase8_2ep) f9e4d2f verified williamium committed 17 days ago
add sft_3b_gpt_llava_mp_2ep (sft_qwen2.5vl3b_gpt_llava_multiprompt_2ep) 28c75c3 verified williamium committed 17 days ago
add sft_7b_gpt_mp_mixfv_2ep (sft_qwen2.5vl7b_gpt_mixfv_multiprompt_2ep) 0122f47 verified williamium committed 20 days ago
add sft_7b_gpt_mp_mixfv_1ep (sft_qwen2.5vl7b_gpt_mixfv_multiprompt_1ep) 0f5050c verified williamium committed 20 days ago
add sft_7b_gpt_mp_mixfv (sft_qwen2.5vl7b_gpt_mixfv_multiprompt) f776782 verified williamium committed 20 days ago
add sft_3b_gpt_mp_mixfv_2ep (sft_qwen2.5vl3b_gpt_mixfv_multiprompt_2ep) dde61d9 verified williamium committed 20 days ago
add v15_3b_sft_mp_mixfv (sft_qwen2.5vl3b_gpt_mixfv_multiprompt) 63f351b verified williamium committed 20 days ago
add v12_3b_lpan_orig (grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_len-pan-max-256) fd4bdbb verified williamium committed 22 days ago
add v11_3b_gate_mp_mixfv (grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_gate_v5_multiprompt_mixfv) b2431c9 verified williamium committed 22 days ago
add v10_3b_lpan_fv (grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_len-pan-max-256_finevision) 83f35cd verified williamium committed 23 days ago
add v9_3b_lpan_t384s5c10 (grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_lpan_t384_s5_c10) e8501b0 verified williamium committed 24 days ago
add v8_3b_lpan_t128s10c20 (grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_lpan_t128_s10_c20) c4dcdcd verified williamium committed 24 days ago
add v7_3b_gate_v5 (grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_gate_v5) 31837c0 verified williamium committed 24 days ago
add v4_3b_lpan_mixfv (grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_len-pan-max-256_mixfinevision) 846002d verified williamium committed 25 days ago
add v6_3b_lpan_s20c40 (grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_lpan_t256_s20_c40) ec16c04 verified williamium committed 26 days ago
add 3B ep3 (grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep3) global_step_144 9f6df90 verified williamium committed 26 days ago
Add training code for grpo_Qwen2.5-VL-7B-Instruct_tr1024_mini256_micro16_n8_lr5e-6_cosine_ep1_len-pan-max-256_mixfinevision 2c7a436 verified williamium committed 27 days ago
add v4_7b_lpan_mixfv merged ckpt (global_step_48) 621ddfc verified williamium committed 27 days ago
Move ckpt48 merged HF files into grpo_Qwen2.5-VL-7B-Instruct_tr1024_mini256_micro16_n8_lr5e-6_cosine_ep1_len-pan-max-256/global_step_48/ (identify the run) e5d682b verified williamium committed on May 24