Create README.md
Browse files
README.md
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
!deepspeed kto.py \
|
| 2 |
+
--save_path '/root/chai/kto' \
|
| 3 |
+
--save_steps 50 \
|
| 4 |
+
--logging_steps 10 \
|
| 5 |
+
--eval_steps -1 \
|
| 6 |
+
--train_batch_size 256 \
|
| 7 |
+
--micro_train_batch_size 1 \
|
| 8 |
+
--pretrain '/root/chai/mistralai/Mistral-Nemo-Instruct-2407' \
|
| 9 |
+
--bf16 \
|
| 10 |
+
--max_epochs 1 \
|
| 11 |
+
--max_len 1348 \
|
| 12 |
+
--zero_stage 2 \
|
| 13 |
+
--learning_rate 5e-7 \
|
| 14 |
+
--dataset '/root/chai/1_kto' \
|
| 15 |
+
--input_key instruction \
|
| 16 |
+
--output_key response \
|
| 17 |
+
--label_key score \
|
| 18 |
+
--flash_attn \
|
| 19 |
+
--beta 0.1 \
|
| 20 |
+
--max_samples 100000 \
|
| 21 |
+
--gradient_checkpointing \
|
| 22 |
+
--lora_rank 16 \
|
| 23 |
+
--lora_alpha 32 \
|
| 24 |
+
--lora_dropout 0.05
|
| 25 |
+
# --use_ms False
|
| 26 |
+
|
| 27 |
+
# Dylan2048/ultrafeedback-unpaired-preferences
|