ertghiu256's picture
Update README.md
810fad5 verified
|
raw
history blame
166 Bytes
metadata
# Repository metadata: license, datasets, base model, and tags.
# NOTE(review): looks like Hugging Face model-card front matter taken from
# README.md; the enclosing `---` delimiters are not visible here — confirm.

# License identifier declared for this repository.
license: apache-2.0
# Datasets associated with this repository, given as `owner/name` ids.
# Presumably the data used for fine-tuning — verify against training setup.
datasets:
  - nvidia/OpenCodeReasoning
  - vicgalle/creative-rubrics-gpt-4.5-o3-R1
# Base model(s) this repository declares, given as `owner/name` ids.
base_model:
  - unsloth/Qwen3-4B
# Free-form tags attached to the repository.
# NOTE(review): `unsloth`, `trl`, `sft` suggest supervised fine-tuning done
# with TRL via Unsloth — confirm before relying on this.
tags:
  - unsloth
  - trl
  - sft