Spaces:
Sleeping
Sleeping
File size: 1,231 Bytes
1c43d7b |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 |
#!/bin/bash
# Copyright 2024 Alibaba Inc. All Rights Reserved.
# Launch train.py for the `llm` model on a single node through torchrun,
# starting one process per device id listed in CUDA_VISIBLE_DEVICES.
#
# `set -e` is intentionally not used: torchrun is the last command, so its
# exit status is already the exit status of this script.
set -u # abort on a misspelled/unset variable instead of passing "" to train.py

pretrained_model_dir=./pretrained_models/CosyVoice2-0.5B

# train llm
export CUDA_VISIBLE_DEVICES="0,1,2,3"

# Count the comma-separated device ids with the read builtin (no echo|awk fork).
IFS=',' read -r -a gpu_ids <<< "$CUDA_VISIBLE_DEVICES"
num_gpus=${#gpu_ids[@]}

job_id=1986
# NOTE(review): dist_backend is not passed to any command in this script.
# Kept as-is; confirm whether train.py is expected to receive it.
# shellcheck disable=SC2034
dist_backend="nccl"
num_workers=24
prefetch=100
train_engine=torch_ddp
model=llm

# Launcher options (rendezvous settings and process count).
torchrun_args=(
  --nnodes=1
  --nproc_per_node="$num_gpus"
  --rdzv_id="$job_id"
  --rdzv_backend="c10d"
  --rdzv_endpoint="localhost:1234"
)

# Options forwarded to train.py. Kept in an array so each value stays a single
# argument even if a path ever contains whitespace or glob characters.
# NOTE(review): --train_data and --cv_data point at the same list file;
# confirm that this is intended.
train_args=(
  --train_engine "$train_engine"
  --config config.yaml
  --train_data ./data.list
  --cv_data ./data.list
  --qwen_pretrain_path "$pretrained_model_dir/CosyVoice-BlankEN"
  --model "$model"
  --model_dir "/data/checkpoint/$model/"
  --num_workers "$num_workers"
  --prefetch "$prefetch"
  --use_amp
  # Derived from pretrained_model_dir so both paths cannot drift apart.
  --pretrained_model "$pretrained_model_dir/llm.pt"
)

torchrun "${torchrun_args[@]}" train.py "${train_args[@]}"
# torchrun --nproc_per_node=4 --nnodes=1 --rdzv_id=2024 --rdzv_backend="c10d" --rdzv_endpoint="localhost:0" `which s3tokenizer` --root_path /data/dataset/ \
# --model speech_tokenizer_v2_25hz \
# --device "cuda" \
# --batch_size 64 \
# --file_list /data/learnable-speech/speech/files.txt \
# --skip_existing