RLVR-SGDM-Gap / .gitattributes
DatPySci's picture
Upload synthetic/Qwen2.5-3B-Instruct-Polaris/polaris_t0.7_p1.0_n32-MNT3072.jsonl with huggingface_hub
122c251 verified
raw
history blame
11.2 kB
# Generic Git LFS rules keyed on file extension / name glob.
# Every rule assigns the `lfs` driver to the filter, diff and merge attributes
# and unsets `text` (-text), so matching files are stored as LFS pointers and
# are never subject to end-of-line normalization.
# Patterns without a slash match the file name at any directory depth.
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
# Any file name containing ".lfs." (e.g. "weights.lfs.dat").
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
# This pattern contains a slash, so it is anchored to the directory holding
# this .gitattributes file: it covers files beneath a top-level saved_model/.
# NOTE(review): presumably TensorFlow SavedModel exports -- confirm.
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
# Tar archives with a further suffix (e.g. .tar.gz), then plain .tar.
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
# Any file name containing "tfevents" anywhere in it.
# NOTE(review): presumably TensorBoard event logs -- confirm.
*tfevents* filter=lfs diff=lfs merge=lfs -text
# Per-file LFS rules for the tokenizer.json shipped with each
# Qwen2.5-3B-Instruct-polaris-AdamW-GRPO checkpoint directory.
# Each path is listed literally (no wildcard), so only these exact files are
# affected; tokenizer.json files elsewhere are not matched by these rules.
# NOTE(review): "bszN" / "stepM" presumably encode batch size and training
# step -- confirm against the training scripts.
#
# The first two entries use a flat "<run>-bszN-stepM/" directory name.
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO-bsz16-step64/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO-bsz32-step64/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
# The remaining entries use a nested "<run>/bszN/stepM/" layout covering
# bsz in {32, 64, 128, 256} and step in {64, 128, ..., 512}.
# NOTE(review): bsz64/step320 is the only combination of that grid with no
# entry here -- verify whether that checkpoint exists and needs a rule.
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz32/step64/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz32/step128/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz32/step192/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz32/step256/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz64/step64/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz64/step128/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz64/step192/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz64/step256/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz32/step320/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz32/step384/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz32/step448/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz32/step512/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz64/step384/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz64/step448/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz64/step512/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz128/step64/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz128/step128/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz128/step192/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz128/step256/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz128/step320/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz128/step384/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz128/step448/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz128/step512/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz256/step64/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz256/step128/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz256/step192/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz256/step256/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz256/step320/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz256/step384/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz256/step448/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen2.5-3B-Instruct-polaris-AdamW-GRPO/bsz256/step512/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
# Per-file LFS rules for the actor_hf/tokenizer.json of each
# Llama-3.2-3B-Instruct-polaris-GRPO checkpoint.
# Directory layout is "<run>--bszN/global_step_M/actor_hf/". Every combination
# of bsz in {16, 32, 64, 128, 256, 512} and global_step in {64, 128, ..., 512}
# is listed (48 entries). The entries are in no particular order; order does
# not matter here because the paths are distinct and all rules set identical
# attributes.
# Paths are literal (no wildcard), so only these exact files are affected.
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_192/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_64/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_512/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_192/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_256/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_192/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_320/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_512/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_256/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_320/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_128/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_128/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_256/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_384/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_448/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_192/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_384/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_512/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_128/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_448/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_512/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_320/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_128/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_256/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_384/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_64/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_256/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_448/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_64/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_320/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_448/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_512/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_448/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz64/global_step_512/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_448/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_64/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_192/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_256/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_128/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_192/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_128/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz512/global_step_64/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_384/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_384/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz16/global_step_320/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz32/global_step_384/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz128/global_step_320/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Llama-3.2-3B-Instruct-polaris-GRPO--bsz256/global_step_64/actor_hf/tokenizer.json filter=lfs diff=lfs merge=lfs -text
# Per-file LFS rules for individual .jsonl files under synthetic/.
# There is no generic "*.jsonl" rule among the extension patterns in this
# file, so each such file that should live in LFS needs its own entry here.
# NOTE(review): presumably model-generated datasets too large for regular
# Git storage -- confirm.
synthetic/Qwen2.5-0.5B-GSM8k-synthetic.jsonl filter=lfs diff=lfs merge=lfs -text
synthetic/Qwen2.5-3B-Instruct-Polaris/polaris_t0.7_p1.0_n32-MNT3072.jsonl filter=lfs diff=lfs merge=lfs -text