# SofT-GRPO-master / .gitattributes
# zz1358m's picture
# Upload mainprocess.png
# f6973b1 verified
# Attribute rules for this repository.
#
# Every rule below assigns the same four attributes to the paths it matches:
#   filter=lfs  - content is passed through the filter driver named "lfs"
#   diff=lfs    - diffs are produced by the diff driver named "lfs"
#   merge=lfs   - merges are performed by the merge driver named "lfs"
#   -text       - the "text" attribute is unset, so no end-of-line
#                 normalization is applied to the file
# NOTE(review): the "lfs" drivers are presumably the ones installed by
# Git LFS (`git lfs install`); they are defined in git config, not here.
#
# Because all rules set identical attributes, overlapping patterns
# (e.g. `*.tar.*` and `*.gz` both matching `x.tar.gz`) do not conflict.

# --- Generic patterns ---------------------------------------------------
# Patterns without a slash match on file name at any directory depth.
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
# Contains a slash, so it is matched relative to the directory holding this
# file: everything underneath a top-level `saved_model/` directory.
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
# Any file whose name contains "tfevents".
*tfevents* filter=lfs diff=lfs merge=lfs -text

# --- Individually listed files -------------------------------------------
# The remaining rules name exact paths (relative to this file's directory)
# rather than extensions; `.txt`, `.png`, `.jpeg` and `.json` are not covered
# by any generic pattern above, so each file is listed explicitly.

# Result text files under Results/testing-results/.
Results/testing-results/1.5B-GRPO-discrete-token-output-temperature=0.6.txt filter=lfs diff=lfs merge=lfs -text
Results/testing-results/1.5B-GRPO-soft-output-temperature=0.6.txt filter=lfs diff=lfs merge=lfs -text
Results/testing-results/1.5B-Soft-GRPO-soft-thinking-output.txt filter=lfs diff=lfs merge=lfs -text
Results/testing-results/1.5B-nofinetune-discrete-token-output-temperature=0.6.txt filter=lfs diff=lfs merge=lfs -text
Results/testing-results/1.5B-nofinetune-soft-output-temperature=0.6.txt filter=lfs diff=lfs merge=lfs -text

# Image files under Soft-Thinking+noise+loss-main/.
Soft-Thinking+noise+loss-main/imgs/paper.jpeg filter=lfs diff=lfs merge=lfs -text
Soft-Thinking+noise+loss-main/sglang_soft_thinking_pkg/assets/logo.png filter=lfs diff=lfs merge=lfs -text
Soft-Thinking+noise+loss-main/sglang_soft_thinking_pkg/docs/_static/image/logo.png filter=lfs diff=lfs merge=lfs -text
Soft-Thinking+noise+loss-main/sglang_soft_thinking_pkg/examples/frontend_language/quick_start/images/cat.jpeg filter=lfs diff=lfs merge=lfs -text
Soft-Thinking+noise+loss-main/sglang_soft_thinking_pkg/examples/frontend_language/quick_start/images/dog.jpeg filter=lfs diff=lfs merge=lfs -text

# tokenizer.json files under saved_weight/, one per listed model directory.
# NOTE(review): the "Deepeeek" spelling is part of the path pattern and
# presumably mirrors the on-disk directory names - do not "correct" it here
# without renaming the directories as well.
saved_weight/Deepeeek-Qwen-1.5B+GRPO/tokenizer.json filter=lfs diff=lfs merge=lfs -text
saved_weight/Deepeeek-Qwen-1.5B+SofT-GRPO/tokenizer.json filter=lfs diff=lfs merge=lfs -text
saved_weight/Deepeeek-Qwen-7B+GRPO/tokenizer.json filter=lfs diff=lfs merge=lfs -text
saved_weight/Deepeeek-Qwen-7B+SofT-GRPO/tokenizer.json filter=lfs diff=lfs merge=lfs -text
saved_weight/LlaMA3.2-3B-Instruct+GRPO/tokenizer.json filter=lfs diff=lfs merge=lfs -text
saved_weight/LlaMA3.2-3B-Instruct+SofT-GRPO/tokenizer.json filter=lfs diff=lfs merge=lfs -text

# Single image under assets/.
assets/mainprocess.png filter=lfs diff=lfs merge=lfs -text