# Model metadata. The key names match the Hugging Face model-card schema
# (NOTE(review): confirm the consumer; add `---` delimiters if this is meant
# to be README front matter).
# Every top-level key must appear exactly once: duplicate mapping keys are
# invalid YAML, and most parsers silently keep only the last occurrence.
license: mit
tags:
- unsloth
- trl
- sft
datasets:
- HUGG222/R1-Like-Dataset
language:
- en
base_model:
- Qwen/Qwen2.5-3B-Instruct