Update README.md
Browse files
README.md
CHANGED
|
@@ -98,7 +98,7 @@ lora_layers: 32
|
|
| 98 |
batch_size: 1
|
| 99 |
|
| 100 |
# Iterations to train for.
|
| 101 |
-
iters:
|
| 102 |
|
| 103 |
# Number of validation batches, -1 uses the entire validation set.
|
| 104 |
val_batches: 25
|
|
@@ -144,9 +144,9 @@ lora_parameters:
|
|
| 144 |
dropout: 0.05
|
| 145 |
|
| 146 |
# Schedule can only be specified in a config file, uncomment to use.
|
| 147 |
-
lr_schedule:
|
| 148 |
-
name: cosine_decay
|
| 149 |
-
warmup: 100 # 0 for no warmup
|
| 150 |
-
warmup_init: 1e-7 # 0 if not specified
|
| 151 |
-
arguments: [1e-6, 1000, 1e-7] # passed to scheduler
|
| 152 |
```
|
|
|
|
| 98 |
batch_size: 1
|
| 99 |
|
| 100 |
# Iterations to train for.
|
| 101 |
+
iters: 6000
|
| 102 |
|
| 103 |
# Number of validation batches, -1 uses the entire validation set.
|
| 104 |
val_batches: 25
|
|
|
|
| 144 |
dropout: 0.05
|
| 145 |
|
| 146 |
# Schedule can only be specified in a config file, uncomment to use.
|
| 147 |
+
#lr_schedule:
|
| 148 |
+
# name: cosine_decay
|
| 149 |
+
# warmup: 100 # 0 for no warmup
|
| 150 |
+
# warmup_init: 1e-7 # 0 if not specified
|
| 151 |
+
# arguments: [1e-6, 1000, 1e-7] # passed to scheduler
|
| 152 |
```
|