lglg666's picture
Upload folder using huggingface_hub
6766eda verified
pip install torch_complex
model_path=MODEL_PATH
data_path=DATA_PATH
label_path=LABEL_PATH
train_subset=train_960
valid_subset=valid
distributed_world_size=WORLD_SIZE
update_freq=$((32/$WORLD_SIZE))
max_tokens=1400000
warmup_updates=32000
total_num_update=400000
mkdir -p ${model_path}
python train.py \
--ddp-backend no_c10d \
--distributed-backend 'nccl' \
--distributed-world-size ${distributed_world_size} \
--distributed-port 29671 \
--nprocs-per-node 8 \
--find-unused-parameters \
--fp16 \
--log-format json \
--log-interval 200 \
--seed 1337 \
--save-dir ${model_path} \
--save-interval-updates 5000 \
--keep-interval-updates 10 \
--no-epoch-checkpoints \
--num-workers 6 \
--task hubert_pretraining \
--criterion hubert \
--arch ils_hubert \
--train-subset ${train_subset} \
--valid-subset ${valid_subset} \
--log-keys '[]' \
${data_path} \
--label-dir ${label_path} \
--labels '["km"]' \
--sample-rate 16000 \
--max-sample-size 250000 \
--min-sample-size 32000 \
--max-tokens ${max_tokens} \
--skip-invalid-size-inputs-valid-test \
--validate-interval 5 \
--validate-interval-updates 10000 \
--pred-masked-weight 1.0 \
--pred-nomask-weight 0.0 \
--loss-weights [10,] \
--label-rate 50 \
--mask-prob 0.80 \
--extractor-mode default \
--conv-feature-layers '[(512,10,5)] + [(512,3,2)] * 4 + [(512,2,2)] * 2' \
--final-dim 256 \
--encoder-layerdrop 0.05 \
--dropout-input 0.1 \
--dropout-features 0.1 \
--dropout 0.1 \
--attention-dropout 0.1 \
--feature-grad-mult 0.1 \
--activation-dropout 0.0 \
--optimizer adam \
--adam-betas '(0.9,0.98)' \
--adam-eps 1e-06 \
--weight-decay 0.01 \
--lr-scheduler polynomial_decay \
--warmup-updates ${warmup_updates} \
--total-num-update ${total_num_update} \
--max-update 400000 \
--lr 0.0005 \
--clip-norm 10.0 \
--update-freq ${update_freq} \
--predict-layers "[4,12]" \
--relative-position-embedding \
--num-buckets 320 \
--max-distance 800 \
--required-batch-size-multiple 1 \
--separate-label-embeds