Upload train_glm47_flash.py with huggingface_hub
Browse files
- train_glm47_flash.py +1 -1
train_glm47_flash.py
CHANGED
|
@@ -158,7 +158,7 @@ training_config = SFTConfig(
|
|
| 158 |
per_device_eval_batch_size=1,
|
| 159 |
gradient_accumulation_steps=16, # Effective batch size: 16
|
| 160 |
learning_rate=2e-4,
|
| 161 |
-
|
| 162 |
|
| 163 |
# Memory optimization
|
| 164 |
gradient_checkpointing=True,
|
|
|
|
| 158 |
per_device_eval_batch_size=1,
|
| 159 |
gradient_accumulation_steps=16, # Effective batch size: 16
|
| 160 |
learning_rate=2e-4,
|
| 161 |
+
max_length=1024, # Reduced for memory
|
| 162 |
|
| 163 |
# Memory optimization
|
| 164 |
gradient_checkpointing=True,
|