micro_batch_size: 1
Browse files
scripts/pretrain-core-model.yaml
CHANGED
@@ -68,8 +68,8 @@ train:

 # Number of samples per data-parallel rank (type: int, default: 4)
 # micro_batch_size: 4
-micro_batch_size: 2
-
+# micro_batch_size: 2
+micro_batch_size: 1

 # Number of iterations with learning rate warmup active (type: int, default: 2000)
 lr_warmup_steps: 200