# Student0809's picture
# Add files using upload-large-folder tool
# cb2428f verified
# Train
# Runs `swift sft` for a LoRA fine-tune of Qwen/Qwen2-1.5B-Instruct with
# LoRA-GA weight initialization, restricted to CUDA device 0.
#
# The option list is accumulated in the positional parameters (POSIX `set --`)
# so related flags can be grouped and annotated. This overwrites any arguments
# passed to the script, which are not used here.

# Base model, tuner type and training dataset.
set -- \
  --model Qwen/Qwen2-1.5B-Instruct \
  --train_type lora \
  --dataset 'swift/self-cognition#1000'

# Epoch count, per-device batch size and learning rate.
set -- "$@" \
  --num_train_epochs 1 \
  --per_device_train_batch_size 1 \
  --learning_rate 1e-4

# LoRA adapter shape.
set -- "$@" \
  --lora_rank 8 \
  --lora_alpha 32

# LoRA-GA initialization settings.
set -- "$@" \
  --init_weights lora-ga \
  --lora_ga_batch_size 2 \
  --lora_ga_iters 2 \
  --lora_ga_max_length 1024 \
  --lora_ga_direction ArB2r \
  --lora_ga_scale stable \
  --lora_ga_stable_gamma 16

# Gradient accumulation plus evaluation, checkpoint and logging intervals.
set -- "$@" \
  --gradient_accumulation_steps 16 \
  --eval_steps 100 \
  --save_steps 100 \
  --save_total_limit 2 \
  --logging_steps 5

# Author and name recorded for the trained model.
set -- "$@" \
  --model_author swift \
  --model_name swift-robot

# The environment assignment is scoped to this single command.
CUDA_VISIBLE_DEVICES=0 swift sft "$@"
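# Infer (optional): uncomment after training and replace --ckpt_dir with the
# checkpoint directory produced by your own run; the path below is an example.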
# swift infer \
# --model Qwen/Qwen2-1.5B-Instruct \
# --ckpt_dir ./output/Qwen2-1.5B-Instruct/v0-20241214-191235/checkpoint-62/converted/default \
# --infer_backend pt \
# --stream true \
# --max_new_tokens 2048