swapnil7777/sfpo-gxpo-qwen-3b-k-5-hendrycks-math-seed42-20260410-184131-best-checkpoint Updated Apr 11
swapnil7777/sfpo-gxpo-qwen-3b-k-5-hendrycks-math-seed42-20260410-184131-checkpoint-228 Updated Apr 11
swapnil7777/sfpo-gxpo-qwen-3b-k-5-hendrycks-math-seed42-20260410-184131-checkpoint-232 Updated Apr 11
swapnil7777/sfpo-gxpo-qwen-3b-k-5-hendrycks-math-seed42-20260410-184131-checkpoint-234 Updated Apr 11
swapnil7777/sfpo-sfpo-qwen-3b-k-3-hendrycks-math-seed42-20260410-100614-best-checkpoint Updated Apr 11
swapnil7777/sfpo-sfpo-qwen-3b-k-3-hendrycks-math-seed42-20260410-100614-checkpoint-228 Updated Apr 11
swapnil7777/sfpo-sfpo-qwen-3b-k-3-hendrycks-math-seed42-20260410-100614-checkpoint-394 Updated Apr 11
swapnil7777/sfpo-sfpo-qwen-3b-k-3-hendrycks-math-seed42-20260410-100614-checkpoint-396 Updated Apr 11
swapnil7777/sfpo-sfpo-qwen-3b-k-5-hendrycks-math-seed42-20260410-100741-best-checkpoint Updated Apr 11
swapnil7777/sfpo-sfpo-qwen-3b-k-5-hendrycks-math-seed42-20260410-100741-checkpoint-392 Updated Apr 11 • 1
swapnil7777/sfpo-sfpo-qwen-3b-k-5-hendrycks-math-seed42-20260410-100741-checkpoint-394 Updated Apr 11
swapnil7777/gxpo-gxpo-qwen-3b-k-3-shutoff-trajectory-aware-hendrycks-math-seed42-20260411-114108-be-a73dba72 Updated Apr 12
swapnil7777/gxpo-gxpo-qwen-3b-k-3-shutoff-trajectory-aware-hendrycks-math-seed42-20260411-114108-ch-8f7a9687 Updated Apr 12
swapnil7777/gxpo-gxpo-qwen-3b-k-3-shutoff-trajectory-aware-hendrycks-math-seed42-20260411-114108-ch-2393e580 Updated Apr 12
swapnil7777/gxpo-gxpo-qwen-3b-k-3-shutoff-trajectory-aware-hendrycks-math-seed42-20260411-114108-ch-9c4ebc27 Updated Apr 12
swapnil7777/gxpo-gxpo-qwen-3b-k-5-shutoff-trajectory-aware-hendrycks-math-seed42-20260411-114637-be-52f7c6e5 Updated Apr 12