ssdataanalysis committed on
Commit
76bf694
·
verified ·
1 Parent(s): b1581a4

Fix: add assistant_only_loss=False to prevent all labels being masked to -100

Browse files
Files changed (1) hide show
  1. train.py +2 -1
train.py CHANGED
@@ -122,6 +122,7 @@ training_args = SFTConfig(
122
  weight_decay=0.01,
123
  max_length=2048,
124
  packing=False,
 
125
  bf16=True,
126
  logging_strategy="steps",
127
  logging_steps=10,
@@ -133,7 +134,7 @@ training_args = SFTConfig(
133
  push_to_hub=True,
134
  hub_model_id=output_dir,
135
  report_to="trackio",
136
- run_name=output_dir.replace("/", "-") + "-optimal-resume",
137
  remove_unused_columns=False,
138
  disable_tqdm=True,
139
  dataset_num_proc=4,
 
122
  weight_decay=0.01,
123
  max_length=2048,
124
  packing=False,
125
+ assistant_only_loss=False, # CRITICAL FIX: prevent all labels being masked to -100
126
  bf16=True,
127
  logging_strategy="steps",
128
  logging_steps=10,
 
134
  push_to_hub=True,
135
  hub_model_id=output_dir,
136
  report_to="trackio",
137
+ run_name=output_dir.replace("/", "-") + "-optimal",
138
  remove_unused_columns=False,
139
  disable_tqdm=True,
140
  dataset_num_proc=4,