Upload scripts/train_alizee_v2_stage1_sft.py with huggingface_hub
Browse files
scripts/train_alizee_v2_stage1_sft.py
CHANGED
|
@@ -270,7 +270,7 @@ training_config = SFTConfig(
|
|
| 270 |
per_device_eval_batch_size=PER_DEVICE_BATCH,
|
| 271 |
gradient_accumulation_steps=GRADIENT_ACCUMULATION,
|
| 272 |
learning_rate=LEARNING_RATE,
|
| 273 |
-
|
| 274 |
|
| 275 |
# Optimization
|
| 276 |
warmup_ratio=WARMUP_RATIO,
|
|
|
|
| 270 |
per_device_eval_batch_size=PER_DEVICE_BATCH,
|
| 271 |
gradient_accumulation_steps=GRADIENT_ACCUMULATION,
|
| 272 |
learning_rate=LEARNING_RATE,
|
| 273 |
+
max_length=MAX_SEQ_LENGTH, # newer TRL releases name this SFTConfig argument max_length; max_seq_length is the older, deprecated name
|
| 274 |
|
| 275 |
# Optimization
|
| 276 |
warmup_ratio=WARMUP_RATIO,
|