Update README.md
Browse files
README.md
CHANGED
|
@@ -59,12 +59,12 @@ trainer = SFTTrainer(
|
|
| 59 |
max_steps=10000,
|
| 60 |
learning_rate=1e-4,
|
| 61 |
logging_steps=1,
|
| 62 |
-
output_dir="
|
| 63 |
optim="paged_adamw_32bit",report_to="none"
|
| 64 |
)
|
| 65 |
)
|
| 66 |
trainer.train()
|
| 67 |
-
trainer.model.save_pretrained("
|
| 68 |
-
trainer.tokenizer.save_pretrained("
|
| 69 |
|
| 70 |
```
|
|
|
|
| 59 |
max_steps=10000,
|
| 60 |
learning_rate=1e-4,
|
| 61 |
logging_steps=1,
|
| 62 |
+
output_dir="1B_outputs", overwrite_output_dir=True,save_steps=1000,
|
| 63 |
optim="paged_adamw_32bit",report_to="none"
|
| 64 |
)
|
| 65 |
)
|
| 66 |
trainer.train()
|
| 67 |
+
trainer.model.save_pretrained("1B-final", dtype=torch.float32)
|
| 68 |
+
trainer.tokenizer.save_pretrained("1B-final")
|
| 69 |
|
| 70 |
```
|