| *.7z filter=lfs diff=lfs merge=lfs -text | |
| *.arrow filter=lfs diff=lfs merge=lfs -text | |
| *.bin filter=lfs diff=lfs merge=lfs -text | |
| *.bz2 filter=lfs diff=lfs merge=lfs -text | |
| *.ckpt filter=lfs diff=lfs merge=lfs -text | |
| *.ftz filter=lfs diff=lfs merge=lfs -text | |
| *.gz filter=lfs diff=lfs merge=lfs -text | |
| *.h5 filter=lfs diff=lfs merge=lfs -text | |
| *.joblib filter=lfs diff=lfs merge=lfs -text | |
| *.lfs.* filter=lfs diff=lfs merge=lfs -text | |
| *.mlmodel filter=lfs diff=lfs merge=lfs -text | |
| *.model filter=lfs diff=lfs merge=lfs -text | |
| *.msgpack filter=lfs diff=lfs merge=lfs -text | |
| *.npy filter=lfs diff=lfs merge=lfs -text | |
| *.npz filter=lfs diff=lfs merge=lfs -text | |
| *.onnx filter=lfs diff=lfs merge=lfs -text | |
| *.ot filter=lfs diff=lfs merge=lfs -text | |
| *.parquet filter=lfs diff=lfs merge=lfs -text | |
| *.pb filter=lfs diff=lfs merge=lfs -text | |
| *.pickle filter=lfs diff=lfs merge=lfs -text | |
| *.pkl filter=lfs diff=lfs merge=lfs -text | |
| *.pt filter=lfs diff=lfs merge=lfs -text | |
| *.pth filter=lfs diff=lfs merge=lfs -text | |
| *.rar filter=lfs diff=lfs merge=lfs -text | |
| *.safetensors filter=lfs diff=lfs merge=lfs -text | |
| saved_model/**/* filter=lfs diff=lfs merge=lfs -text | |
| *.tar.* filter=lfs diff=lfs merge=lfs -text | |
| *.tar filter=lfs diff=lfs merge=lfs -text | |
| *.tflite filter=lfs diff=lfs merge=lfs -text | |
| *.tgz filter=lfs diff=lfs merge=lfs -text | |
| *.wasm filter=lfs diff=lfs merge=lfs -text | |
| *.xz filter=lfs diff=lfs merge=lfs -text | |
| *.zip filter=lfs diff=lfs merge=lfs -text | |
| *.zst filter=lfs diff=lfs merge=lfs -text | |
| *tfevents* filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegRAFT_correct_rerun/global_step_400/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/72.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/67.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/80.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegRAFT_onpolicy_numina_hard_rerun_DRGRPO_norm/rollouts/379.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/6.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/28.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/25.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/26.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/57.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/7.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/32.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/73.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/63.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/74.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/62.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/47.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/8.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/77.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/24.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/30.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/56.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/38.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/9.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/61.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/23.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/27.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/41.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/66.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/34.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/71.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/39.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/64.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/76.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/36.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/42.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/17.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/11.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/16.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegRAFT_onpolicy_numina_hard_rerun_DRGRPO_norm/rollouts/378.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegRAFT_onpolicy_numina_hard_rerun_DRGRPO_norm/rollouts/377.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/69.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/29.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/68.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/75.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/48.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/52.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/40.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/78.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/50.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/51.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/46.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/53.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/79.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/35.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/31.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/55.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/54.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/37.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/33.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/65.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/70.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/10.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/14.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/15.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/12.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/43.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/13.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/44.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/18.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/45.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/20.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/49.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/verl_math_Qwen2p5Math7B_NegativeLoss_32_cosine_logalso_run_tokenmean/rollouts/19.jsonl filter=lfs diff=lfs merge=lfs -text | |
| verl_math_Qwen2p5Math7B_NegLoss_onpolicy_numina_hard_rerun_DRGRPO_norm/rollouts/294.jsonl filter=lfs diff=lfs merge=lfs -text | |