zhenzhe committed on
Commit
17bf88a
·
verified ·
1 Parent(s): c3fdc96

Create README.md

Browse files
Files changed (1) hide show
  1. README.md +19 -0
README.md ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !deepspeed --module openrlhf.cli.train_dpo \
2
+ --save_path '/mnt/nvme1/will/3_dpo' \
3
+ --save_steps 1024 \
4
+ --logging_steps 10 \
5
+ --eval_steps -1 \
6
+ --train_batch_size 512 \
7
+ --micro_train_batch_size 2 \
8
+ --pretrain 'mistralai/Mistral-Nemo-Instruct-2407' \
9
+ --bf16 \
10
+ --max_epochs 1 \
11
+ --max_len 2048 \
12
+ --zero_stage 3 \
13
+ --learning_rate 5e-6 \
14
+ --dataset '/mnt/nvme1/will/2_dpo' \
15
+ --apply_chat_template \
16
+ --chosen_key chosen \
17
+ --rejected_key rejected \
18
+ --flash_attn \
19
+ --gradient_checkpointing