Spaces:
Running
on
Zero
Running
on
Zero
| export CUDA_VISIBLE_DEVICES=0 | |
| SAVE_DIR='./pretrain_data' # to save processed data | |
| CACHE_DIR='./cache' # to save dataset cache | |
| MLS_WAV_DIR='' # downloaded mls wav path | |
| LIBRITTSRMIX_WAV_DIR='' # downloaded librittsrmix wav path | |
| GIGASPEECH_WAV_DIR='' # downloaded gigaspeech wav path | |
| COMMONVOICE_WAV_DIR='' # downloaded commonvoice wav path | |
| EMILIA_WAV_DIR='' # downloaded emilia wav path | |
| CPUS=30 | |
| N_WORKERS=8 | |
| BATCH_SIZE=64 | |
| HUB='OpenSound/CapSpeech' | |
| python preprocess_pretrain.py \ | |
| --hub ${HUB} \ | |
| --save_dir ${SAVE_DIR} \ | |
| --cache_dir ${CACHE_DIR} \ | |
| --libriRmix_wav_dir ${LIBRITTSRMIX_WAV_DIR}\ | |
| --mls_wav_dir ${MLS_WAV_DIR} \ | |
| --commonvoice_dir ${COMMONVOICE_WAV_DIR} \ | |
| --gigaspeech_dir ${GIGASPEECH_WAV_DIR} \ | |
| --emilia_dir ${EMILIA_WAV_DIR} \ | |
| --splits train_PT validation_PT \ | |
| --audio_min_length 3.0 \ | |
| --audio_max_length 18.0 | |
| python phonemize.py \ | |
| --save_dir ${SAVE_DIR} \ | |
| --num_cpus ${CPUS} | |
| python caption.py \ | |
| --save_dir ${SAVE_DIR} | |
| python filemaker.py \ | |
| --save_dir ${SAVE_DIR} | |
| python vocab.py \ | |
| --save_dir ${SAVE_DIR} | |