yuccaaa committed on
Commit
3a93fb8
·
verified ·
1 Parent(s): a7c0ea3

Upload ms-swift/examples/eval/train_eval/train.sh with huggingface_hub

Browse files
ms-swift/examples/eval/train_eval/train.sh ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# Example: LoRA supervised fine-tuning with evaluation during training.
#
# Runs `swift sft` with only GPU 0 exposed to the process
# (CUDA_VISIBLE_DEVICES=0). The run fine-tunes Qwen/Qwen2.5-0.5B-Instruct
# with LoRA (rank 8, alpha 32, all linear layers as target modules) in
# bfloat16 for one epoch.
#
# Evaluation is step-based (every 5 steps) and is configured through the
# --eval_use_evalscope / --eval_datasets / --eval_datasets_args / --eval_limit
# flags: gsm8k, zero few-shot examples, limit of 10.
#
# NOTE(review): the "#100" suffix on the dataset name presumably restricts
# training to 100 samples, and --eval_limit presumably caps the number of
# evaluation samples per dataset -- confirm against the ms-swift docs.
#
# Requirements: the `swift` CLI (ms-swift) must be on PATH.
# Usage: sh train.sh
CUDA_VISIBLE_DEVICES=0 \
swift sft \
    --model "Qwen/Qwen2.5-0.5B-Instruct" \
    --train_type "lora" \
    --dataset "AI-ModelScope/alpaca-gpt4-data-zh#100" \
    --torch_dtype "bfloat16" \
    --num_train_epochs "1" \
    --per_device_train_batch_size "1" \
    --learning_rate "1e-4" \
    --lora_rank "8" \
    --lora_alpha "32" \
    --target_modules "all-linear" \
    --gradient_accumulation_steps "16" \
    --save_steps "50" \
    --save_total_limit "5" \
    --logging_steps "5" \
    --max_length "2048" \
    --eval_strategy "steps" \
    --eval_steps "5" \
    --per_device_eval_batch_size "5" \
    --eval_use_evalscope \
    --eval_datasets "gsm8k" \
    --eval_datasets_args '{"gsm8k": {"few_shot_num": 0}}' \
    --eval_limit "10"