Upload train_code_reasoning.py
Browse files- train_code_reasoning.py +8 -3
train_code_reasoning.py
CHANGED
|
@@ -13,6 +13,7 @@
|
|
| 13 |
import os
|
| 14 |
import random
|
| 15 |
from datasets import load_dataset, concatenate_datasets
|
|
|
|
| 16 |
from trl import SFTTrainer, SFTConfig
|
| 17 |
import trackio
|
| 18 |
|
|
@@ -24,6 +25,9 @@ OUTPUT_DIR = "./code-reasoning-1.5b"
|
|
| 24 |
# Initialize Trackio
|
| 25 |
trackio.init(project="code-reasoning-ft", name="qwen2.5-coder-1.5b-code-reasoning")
|
| 26 |
|
|
|
|
|
|
|
|
|
|
| 27 |
print("Loading and preparing datasets...")
|
| 28 |
|
| 29 |
all_datasets = []
|
|
@@ -159,8 +163,8 @@ training_args = SFTConfig(
|
|
| 159 |
hub_model_id=HUB_MODEL_ID,
|
| 160 |
push_to_hub=True,
|
| 161 |
num_train_epochs=2,
|
| 162 |
-
per_device_train_batch_size=
|
| 163 |
-
gradient_accumulation_steps=
|
| 164 |
learning_rate=5e-5,
|
| 165 |
warmup_steps=300,
|
| 166 |
lr_scheduler_type="cosine",
|
|
@@ -171,7 +175,7 @@ training_args = SFTConfig(
|
|
| 171 |
logging_first_step=True,
|
| 172 |
save_strategy="steps",
|
| 173 |
save_steps=10,
|
| 174 |
-
packing=
|
| 175 |
dataset_num_proc=4,
|
| 176 |
disable_tqdm=True,
|
| 177 |
report_to=["trackio"],
|
|
@@ -184,6 +188,7 @@ trainer = SFTTrainer(
|
|
| 184 |
model=MODEL_ID,
|
| 185 |
train_dataset=train_dataset,
|
| 186 |
args=training_args,
|
|
|
|
| 187 |
)
|
| 188 |
|
| 189 |
print("Starting training...")
|
|
|
|
| 13 |
import os
|
| 14 |
import random
|
| 15 |
from datasets import load_dataset, concatenate_datasets
|
| 16 |
+
from transformers import AutoTokenizer
|
| 17 |
from trl import SFTTrainer, SFTConfig
|
| 18 |
import trackio
|
| 19 |
|
|
|
|
| 25 |
# Initialize Trackio
|
| 26 |
trackio.init(project="code-reasoning-ft", name="qwen2.5-coder-1.5b-code-reasoning")
|
| 27 |
|
| 28 |
+
# Load tokenizer
|
| 29 |
+
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)
|
| 30 |
+
|
| 31 |
print("Loading and preparing datasets...")
|
| 32 |
|
| 33 |
all_datasets = []
|
|
|
|
| 163 |
hub_model_id=HUB_MODEL_ID,
|
| 164 |
push_to_hub=True,
|
| 165 |
num_train_epochs=2,
|
| 166 |
+
per_device_train_batch_size=2,
|
| 167 |
+
gradient_accumulation_steps=8,
|
| 168 |
learning_rate=5e-5,
|
| 169 |
warmup_steps=300,
|
| 170 |
lr_scheduler_type="cosine",
|
|
|
|
| 175 |
logging_first_step=True,
|
| 176 |
save_strategy="steps",
|
| 177 |
save_steps=10,
|
| 178 |
+
packing=False,
|
| 179 |
dataset_num_proc=4,
|
| 180 |
disable_tqdm=True,
|
| 181 |
report_to=["trackio"],
|
|
|
|
| 188 |
model=MODEL_ID,
|
| 189 |
train_dataset=train_dataset,
|
| 190 |
args=training_args,
|
| 191 |
+
processing_class=tokenizer,
|
| 192 |
)
|
| 193 |
|
| 194 |
print("Starting training...")
|