passing2961/finch_8b_kto_held_out_expr_purpose_qwen_max16384_kto_5.0e-7_1.0_train42_cosine Text Generation • 8B • Updated about 20 hours ago • 25
passing2961/finch_27b_hard_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 3.05M • Updated 1 day ago • 11
passing2961/finch_4b_kto_held_out_expr_purpose_qwen_max8192_kto_5.0e-7_1.0_train42_cosine Image-Text-to-Text • 5B • Updated 2 days ago • 179
passing2961/finch_8b_soft_with_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Text Generation • 8B • Updated 2 days ago • 9
passing2961/finch_4b_soft_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 5B • Updated 2 days ago • 11
passing2961/finch_4b_hard_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 5B • Updated 2 days ago • 447
passing2961/finch_8b_soft_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Text Generation • 8B • Updated 2 days ago • 104
passing2961/finch_8b_hard_with_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Text Generation • 8B • Updated 2 days ago • 13
passing2961/finch_9b_soft_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 9B • Updated 2 days ago • 47
passing2961/finch_8b_hard_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Text Generation • 8B • Updated 2 days ago • 2.15k
passing2961/finch_2b_soft_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 3B • Updated 2 days ago • 10
passing2961/finch_9b_hard_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 9B • Updated 2 days ago • 86
passing2961/finch_2b_hard_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 3B • Updated 3 days ago • 13
passing2961/qwen3_5_9b_finch_all_local_hard_with_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 9B • Updated 3 days ago • 12
passing2961/qwen3_5_9b_finch_all_local_hard_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 9B • Updated 3 days ago • 86
passing2961/qwen3_8b_finch_all_local_soft_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Text Generation • 8B • Updated 3 days ago • 2.66k
passing2961/qwen3_5_9b_finch_all_local_soft_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 9B • Updated 4 days ago • 270
passing2961/qwen3_5_4b_finch_all_local_hard_without_held_out_expr_purpose_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 5B • Updated 4 days ago • 16
passing2961/qwen3_5_2b_finch_all_local_hard_without_held_out_expr_purpose_1.0e-5_2.0_train42_cosine Image-Text-to-Text • 3B • Updated 4 days ago • 46
passing2961/qwen3_5_2b_finch_all_local_hard_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Image-Text-to-Text • 3B • Updated 4 days ago • 16
passing2961/qwen3_8b_finch_all_local_hard_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine Text Generation • 8B • Updated 4 days ago • 2.86k
passing2961/qwen3_8b_finch_all_local_hard_without_held_out_expr_purpose_1.0e-5_2.0_train42_cosine Text Generation • 8B • Updated 5 days ago • 211
passing2961/qwen3_8b_finch_187_tasks_expr_purpose_1.0e-5_2.0_train42_cosine Text Generation • 8B • Updated 5 days ago • 12
passing2961/qwen3_0_6b_finch_all_local_hard_expr_purpose_1.0e-5_2.0_train42_cosine 0.8B • Updated 6 days ago • 12
passing2961/qwen3_8b_finch_math_optimization_local_quality_hard_expr_purpose_1.0e-5_2.0_train42_cosine Text Generation • 8B • Updated 6 days ago • 24