Create README.md
Browse files
README.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
!deepspeed --module openrlhf.cli.train_dpo \
|
| 2 |
+
--save_path '/mnt/nvme1/will/3_dpo' \
|
| 3 |
+
--save_steps 1024 \
|
| 4 |
+
--logging_steps 10 \
|
| 5 |
+
--eval_steps -1 \
|
| 6 |
+
--train_batch_size 512 \
|
| 7 |
+
--micro_train_batch_size 2 \
|
| 8 |
+
--pretrain 'mistralai/Mistral-Nemo-Instruct-2407' \
|
| 9 |
+
--bf16 \
|
| 10 |
+
--max_epochs 1 \
|
| 11 |
+
--max_len 2048 \
|
| 12 |
+
--zero_stage 3 \
|
| 13 |
+
--learning_rate 5e-6 \
|
| 14 |
+
--dataset '/mnt/nvme1/will/2_dpo' \
|
| 15 |
+
--apply_chat_template \
|
| 16 |
+
--chosen_key chosen \
|
| 17 |
+
--rejected_key rejected \
|
| 18 |
+
--flash_attn \
|
| 19 |
+
--gradient_checkpointing
|