modrill/rl_math_rl_ready_models_0444_global_step_285_hf Text Generation • 4B • Updated 8 days ago • 14
modrill/math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_9 Text Generation • 4B • Updated 9 days ago • 44
modrill/math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_8 Text Generation • 4B • Updated 9 days ago • 75 •
modrill/math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_7 Text Generation • 4B • Updated 9 days ago • 45
modrill/math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_6 Text Generation • 4B • Updated 9 days ago • 73 •
modrill/math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_5 Text Generation • 4B • Updated 9 days ago • 47
modrill/math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_4 Text Generation • 4B • Updated 9 days ago • 47
modrill/math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_3 Text Generation • 4B • Updated 9 days ago • 112 •
modrill/math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_2 Text Generation • 4B • Updated 9 days ago • 137 •
modrill/math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_1 Text Generation • 4B • Updated 9 days ago • 182 •
modrill/math_no_think_17_qwen3_4b_base_sft_dataless_ls Text Generation • 4B • Updated 9 days ago • 216 •
modrill/lingcoder_shortcot_merged_fixed200k_4k_qwen3_4b_instruct2507 Text Generation • 4B • Updated 10 days ago • 103 •
modrill/lingcoder_shortcot_fixed200k_lora_qwen3_4b_instruct2507 Text Generation • Updated 10 days ago
modrill/kodcode4o_easy_conv_fixed50k_4k_merged_qwen3_4b_instruct2507 Text Generation • 4B • Updated 10 days ago • 99 •
modrill/kodcode4o_hard_conv_fixed42k_4k_merged_qwen3_4b_instruct2507 Text Generation • 4B • Updated 10 days ago • 49
modrill/kodcode4o_hard_conv_fixed42k_4k_lora_qwen3_4b_instruct2507 Text Generation • Updated 10 days ago
modrill/kodcode4o_easy_conv_fixed50k_4k_lora_qwen3_4b_instruct2507 Text Generation • Updated 10 days ago
modrill/kodcode4o_medium_conv_fixed50k_4k_lora_qwen3_4b_instruct2507 Text Generation • Updated 10 days ago