xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_105 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_110 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_115 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_100 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_90 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_95 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_85 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_35 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_80 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_5 3B • Updated Sep 8, 2025 • 3
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_20 3B • Updated Sep 8, 2025 • 24
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_10 3B • Updated Sep 8, 2025 • 1.94k
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_75 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_70 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_65 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_50 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_25 3B • Updated Sep 8, 2025 • 26
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_55 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_40 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_60 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_30 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_45 3B • Updated Sep 8, 2025
xinpeng/big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_15 3B • Updated Sep 8, 2025 • 5
xinpeng/big-math-hard-tiny-llama-3.2-3b-instruct-og-rloo-implicit-cheat-no-global-step-60-actor Updated Sep 6, 2025
xinpeng/big-math-hard-tiny-llama-3.2-3b-instruct-og-rloo-implicit-cheat-no-global_step_75 4B • Updated Sep 5, 2025
xinpeng/big-math-hard-tiny-llama-3.2-3b-instruct-og-rloo-implicit-cheat-no-global_step_85 4B • Updated Sep 5, 2025
xinpeng/big-math-hard-tiny-llama-3.2-3b-instruct-og-rloo-implicit-cheat-no-global_step_65 4B • Updated Sep 5, 2025
xinpeng/big-math-hard-tiny-llama-3.2-3b-instruct-og-rloo-implicit-cheat-no-global_step_80 4B • Updated Sep 5, 2025
xinpeng/big-math-hard-tiny-llama-3.2-3b-instruct-og-rloo-implicit-cheat-no-global_step_70 4B • Updated Sep 5, 2025