zhenzhe committed on
Commit
f5c9257
·
verified ·
1 Parent(s): dc11e33

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +3 -3
README.md CHANGED
@@ -1,6 +1,6 @@
1
  !deepspeed --module openrlhf.cli.train_dpo \
2
- --save_path '/mnt/nvme1/will/7_dpo' \
3
- --ckpt_path '/mnt/nvme1/will/7_dpo_ckpt' \
4
  --save_steps 50 \
5
  --logging_steps 10 \
6
  --eval_steps -1 \
@@ -12,7 +12,7 @@
12
  --max_len 2048 \
13
  --zero_stage 3 \
14
  --learning_rate 5e-7 \
15
- --dataset '/mnt/nvme1/will/7_dpo_data' \
16
  --apply_chat_template \
17
  --chosen_key chosen \
18
  --rejected_key rejected \
 
1
  !deepspeed --module openrlhf.cli.train_dpo \
2
+ --save_path '/mnt/nvme1/will/8_dpo' \
3
+ --ckpt_path '/mnt/nvme1/will/8_dpo_ckpt' \
4
  --save_steps 50 \
5
  --logging_steps 10 \
6
  --eval_steps -1 \
 
12
  --max_len 2048 \
13
  --zero_stage 3 \
14
  --learning_rate 5e-7 \
15
+ --dataset '/mnt/nvme1/will/8_dpo_data' \
16
  --apply_chat_template \
17
  --chosen_key chosen \
18
  --rejected_key rejected \