Update README.md
Browse files
README.md
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
!deepspeed --module openrlhf.cli.train_dpo \
|
| 2 |
-
--save_path '/mnt/nvme1/will/
|
| 3 |
-
--ckpt_path '/mnt/nvme1/will/
|
| 4 |
--save_steps 50 \
|
| 5 |
--logging_steps 10 \
|
| 6 |
--eval_steps -1 \
|
|
@@ -12,7 +12,7 @@
|
|
| 12 |
--max_len 2048 \
|
| 13 |
--zero_stage 3 \
|
| 14 |
--learning_rate 5e-7 \
|
| 15 |
-
--dataset '/mnt/nvme1/will/
|
| 16 |
--apply_chat_template \
|
| 17 |
--chosen_key chosen \
|
| 18 |
--rejected_key rejected \
|
|
|
|
| 1 |
!deepspeed --module openrlhf.cli.train_dpo \
|
| 2 |
+
--save_path '/mnt/nvme1/will/8_dpo' \
|
| 3 |
+
--ckpt_path '/mnt/nvme1/will/8_dpo_ckpt' \
|
| 4 |
--save_steps 50 \
|
| 5 |
--logging_steps 10 \
|
| 6 |
--eval_steps -1 \
|
|
|
|
| 12 |
--max_len 2048 \
|
| 13 |
--zero_stage 3 \
|
| 14 |
--learning_rate 5e-7 \
|
| 15 |
+
--dataset '/mnt/nvme1/will/8_dpo_data' \
|
| 16 |
--apply_chat_template \
|
| 17 |
--chosen_key chosen \
|
| 18 |
--rejected_key rejected \
|