#!/usr/bin/env bash
#
# Launches continue_finetune.py under torchrun (8 processes on this node,
# rendezvous port 3324) and, once training exits successfully, starts
# convert/convert.sh in the background on the resulting output directory.
#
# Usage: run from the directory that contains continue_finetune.py,
#        ./config/ds_z2_fp16.json and the convert/ subdirectory.
#
# Output: checkpoints are written under $OUTPUT_DIR; the conversion job's
#         stdout/stderr go to convert/convert.log.

# Environment consumed by the training processes.
export WANDB_MODE=disabled        # turn off Weights & Biases logging
export CUDA_LAUNCH_BLOCKING=0     # 0 = leave CUDA kernel launches asynchronous

# Run configuration. These are plain shell variables (not exported); they are
# only used to build the command lines below.
DATASET=Instruments
BASE_MODEL=/datain/v-yinju/llama-7b
CKPT_PATH=/datain/v-yinju/rq-llama/v3-train/Instruments/first
DATA_PATH=/datain/v-yinju/rqvae-zzx/data
OUTPUT_DIR=$CKPT_PATH/finetune_more

# Training. The six-entry --tasks list is paired with six-entry
# --train_prompt_sample_num / --train_data_sample_num lists; keep the three
# in sync when editing.
# NOTE(review): with 8 processes x batch 6 x accumulation 2 the effective
# global batch is presumably 96 (assumes one device per process) - confirm.
torchrun --nproc_per_node=8 --master_port=3324 continue_finetune.py \
  --base_model "$BASE_MODEL" \
  --ckpt_path "$CKPT_PATH" \
  --output_dir "$OUTPUT_DIR" \
  --dataset "$DATASET" \
  --data_path "$DATA_PATH" \
  --per_device_batch_size 6 \
  --gradient_accumulation_steps 2 \
  --learning_rate 5e-5 \
  --epochs 4 \
  --weight_decay 0.01 \
  --save_and_eval_strategy epoch \
  --fp16 \
  --deepspeed ./config/ds_z2_fp16.json \
  --dataloader_num_workers 4 \
  --only_train_response \
  --re_index 41 \
  --tasks seqrec,itemsearch,preferenceobtain,item2index,index2item,fusionseqrec \
  --train_prompt_sample_num 1,1,1,1,1,1 \
  --train_data_sample_num 0,0,0,0,0,0 \
  --index_file "$CKPT_PATH/indices.json"
train_status=$?

# Do not convert the output of a failed run: propagate torchrun's exit status.
if [ "$train_status" -ne 0 ]; then
  printf 'continue_finetune.py failed (exit %s); skipping conversion.\n' \
    "$train_status" >&2
  exit "$train_status"
fi

# Conversion. convert.sh is invoked from inside convert/ so that its relative
# paths and convert.log resolve there; nohup + '&' lets it outlive this shell.
cd convert || {
  printf 'cannot cd into convert/; conversion not started.\n' >&2
  exit 1
}
nohup ./convert.sh "$OUTPUT_DIR" >convert.log 2>&1 &
cd ..