moos124 committed on
Commit
0160100
·
verified ·
1 Parent(s): 69a3f67

Upload train_code_reasoning.py

Browse files
Files changed (1) hide show
  1. train_code_reasoning.py +8 -3
train_code_reasoning.py CHANGED
@@ -13,6 +13,7 @@
13
  import os
14
  import random
15
  from datasets import load_dataset, concatenate_datasets
 
16
  from trl import SFTTrainer, SFTConfig
17
  import trackio
18
 
@@ -24,6 +25,9 @@ OUTPUT_DIR = "./code-reasoning-1.5b"
24
  # Initialize Trackio
25
  trackio.init(project="code-reasoning-ft", name="qwen2.5-coder-1.5b-code-reasoning")
26
 
 
 
 
27
  print("Loading and preparing datasets...")
28
 
29
  all_datasets = []
@@ -159,8 +163,8 @@ training_args = SFTConfig(
159
  hub_model_id=HUB_MODEL_ID,
160
  push_to_hub=True,
161
  num_train_epochs=2,
162
- per_device_train_batch_size=4,
163
- gradient_accumulation_steps=4,
164
  learning_rate=5e-5,
165
  warmup_steps=300,
166
  lr_scheduler_type="cosine",
@@ -171,7 +175,7 @@ training_args = SFTConfig(
171
  logging_first_step=True,
172
  save_strategy="steps",
173
  save_steps=10,
174
- packing=True,
175
  dataset_num_proc=4,
176
  disable_tqdm=True,
177
  report_to=["trackio"],
@@ -184,6 +188,7 @@ trainer = SFTTrainer(
184
  model=MODEL_ID,
185
  train_dataset=train_dataset,
186
  args=training_args,
 
187
  )
188
 
189
  print("Starting training...")
 
13
  import os
14
  import random
15
  from datasets import load_dataset, concatenate_datasets
16
+ from transformers import AutoTokenizer
17
  from trl import SFTTrainer, SFTConfig
18
  import trackio
19
 
 
25
  # Initialize Trackio
26
  trackio.init(project="code-reasoning-ft", name="qwen2.5-coder-1.5b-code-reasoning")
27
 
28
+ # Load tokenizer
29
+ tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)
30
+
31
  print("Loading and preparing datasets...")
32
 
33
  all_datasets = []
 
163
  hub_model_id=HUB_MODEL_ID,
164
  push_to_hub=True,
165
  num_train_epochs=2,
166
+ per_device_train_batch_size=2,
167
+ gradient_accumulation_steps=8,
168
  learning_rate=5e-5,
169
  warmup_steps=300,
170
  lr_scheduler_type="cosine",
 
175
  logging_first_step=True,
176
  save_strategy="steps",
177
  save_steps=10,
178
+ packing=False,
179
  dataset_num_proc=4,
180
  disable_tqdm=True,
181
  report_to=["trackio"],
 
188
  model=MODEL_ID,
189
  train_dataset=train_dataset,
190
  args=training_args,
191
+ processing_class=tokenizer,
192
  )
193
 
194
  print("Starting training...")