Upload train.py with huggingface_hub
Browse files
train.py
CHANGED
|
@@ -60,7 +60,7 @@ def main():
|
|
| 60 |
per_device_train_batch_size=1,
|
| 61 |
gradient_accumulation_steps=8,
|
| 62 |
learning_rate=2e-4,
|
| 63 |
-
|
| 64 |
|
| 65 |
# Logging & checkpointing
|
| 66 |
logging_steps=10,
|
|
|
|
| 60 |
per_device_train_batch_size=1,
|
| 61 |
gradient_accumulation_steps=8,
|
| 62 |
learning_rate=2e-4,
|
| 63 |
+
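# NOTE: max_seq_length removed — recent TRL releases no longer accept it in SFTConfig (the argument was renamed to max_length); confirm the exact cutoff against the installed trl version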
|
| 64 |
|
| 65 |
# Logging & checkpointing
|
| 66 |
logging_steps=10,
|