Upload train_glm47_flash_test.py with huggingface_hub
Browse files
train_glm47_flash_test.py
CHANGED
|
@@ -126,7 +126,7 @@ training_config = SFTConfig(
|
|
| 126 |
per_device_train_batch_size=1,
|
| 127 |
gradient_accumulation_steps=4,
|
| 128 |
learning_rate=2e-4,
|
| 129 |
-
|
| 130 |
gradient_checkpointing=True,
|
| 131 |
gradient_checkpointing_kwargs={"use_reentrant": False},
|
| 132 |
logging_steps=5,
|
|
|
|
| 126 |
per_device_train_batch_size=1,
|
| 127 |
gradient_accumulation_steps=4,
|
| 128 |
learning_rate=2e-4,
|
| 129 |
+
max_length=512, # Short for testing
|
| 130 |
gradient_checkpointing=True,
|
| 131 |
gradient_checkpointing_kwargs={"use_reentrant": False},
|
| 132 |
logging_steps=5,
|