| pip install torch_complex | |
| model_path=MODEL_PATH | |
| data_path=DATA_PATH | |
| label_path=LABEL_PATH | |
| train_subset=train_960 | |
| valid_subset=valid | |
| distributed_world_size=WORLD_SIZE | |
| update_freq=$((32/$WORLD_SIZE)) | |
| max_tokens=1400000 | |
| warmup_updates=32000 | |
| total_num_update=400000 | |
| mkdir -p ${model_path} | |
| python train.py \ | |
| --ddp-backend no_c10d \ | |
| --distributed-backend 'nccl' \ | |
| --distributed-world-size ${distributed_world_size} \ | |
| --distributed-port 29671 \ | |
| --nprocs-per-node 8 \ | |
| --find-unused-parameters \ | |
| --fp16 \ | |
| --log-format json \ | |
| --log-interval 200 \ | |
| --seed 1337 \ | |
| --save-dir ${model_path} \ | |
| --save-interval-updates 5000 \ | |
| --keep-interval-updates 10 \ | |
| --no-epoch-checkpoints \ | |
| --num-workers 6 \ | |
| --task hubert_pretraining \ | |
| --criterion hubert \ | |
| --arch ils_hubert \ | |
| --train-subset ${train_subset} \ | |
| --valid-subset ${valid_subset} \ | |
| --log-keys '[]' \ | |
| ${data_path} \ | |
| --label-dir ${label_path} \ | |
| --labels '["km"]' \ | |
| --sample-rate 16000 \ | |
| --max-sample-size 250000 \ | |
| --min-sample-size 32000 \ | |
| --max-tokens ${max_tokens} \ | |
| --skip-invalid-size-inputs-valid-test \ | |
| --validate-interval 5 \ | |
| --validate-interval-updates 10000 \ | |
| --pred-masked-weight 1.0 \ | |
| --pred-nomask-weight 0.0 \ | |
| --loss-weights [10,] \ | |
| --label-rate 50 \ | |
| --mask-prob 0.80 \ | |
| --extractor-mode default \ | |
| --conv-feature-layers '[(512,10,5)] + [(512,3,2)] * 4 + [(512,2,2)] * 2' \ | |
| --final-dim 256 \ | |
| --encoder-layerdrop 0.05 \ | |
| --dropout-input 0.1 \ | |
| --dropout-features 0.1 \ | |
| --dropout 0.1 \ | |
| --attention-dropout 0.1 \ | |
| --feature-grad-mult 0.1 \ | |
| --activation-dropout 0.0 \ | |
| --optimizer adam \ | |
| --adam-betas '(0.9,0.98)' \ | |
| --adam-eps 1e-06 \ | |
| --weight-decay 0.01 \ | |
| --lr-scheduler polynomial_decay \ | |
| --warmup-updates ${warmup_updates} \ | |
| --total-num-update ${total_num_update} \ | |
| --max-update 400000 \ | |
| --lr 0.0005 \ | |
| --clip-norm 10.0 \ | |
| --update-freq ${update_freq} \ | |
| --predict-layers "[4,12]" \ | |
| --relative-position-embedding \ | |
| --num-buckets 320 \ | |
| --max-distance 800 \ | |
| --required-batch-size-multiple 1 \ | |
| --separate-label-embeds | |