metadata
license: apache-2.0
datasets:
- nvidia/OpenCodeReasoning
- vicgalle/creative-rubrics-gpt-4.5-o3-R1
base_model:
- unsloth/Qwen3-4B
tags:
- unsloth
- trl
- sft