zhenzhe committed on
Commit
5c5d70c
·
verified ·
1 Parent(s): 2f732fa

Create README.md

Browse files
Files changed (1) hide show
  1. README.md +27 -0
README.md ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !deepspeed kto.py \
2
+ --save_path '/root/chai/kto' \
3
+ --save_steps 50 \
4
+ --logging_steps 10 \
5
+ --eval_steps -1 \
6
+ --train_batch_size 256 \
7
+ --micro_train_batch_size 1 \
8
+ --pretrain '/root/chai/mistralai/Mistral-Nemo-Instruct-2407' \
9
+ --bf16 \
10
+ --max_epochs 1 \
11
+ --max_len 1348 \
12
+ --zero_stage 2 \
13
+ --learning_rate 5e-7 \
14
+ --dataset '/root/chai/1_kto' \
15
+ --input_key instruction \
16
+ --output_key response \
17
+ --label_key score \
18
+ --flash_attn \
19
+ --beta 0.1 \
20
+ --max_samples 100000 \
21
+ --gradient_checkpointing \
22
+ --lora_rank 16 \
23
+ --lora_alpha 32 \
24
+ --lora_dropout 0.05
25
+ # --use_ms False
26
+
27
+ # Dylan2048/ultrafeedback-unpaired-preferences