# Experiment configuration for the 'popcs' dataset using the FastSpeech2 task
# class. Keys not set here are expected to come from the file(s) listed under
# base_config (presumably merged by the config loader -- verify).
base_config:
  - configs/singing/fs2.yaml

# Audio / spectrogram analysis parameters.
audio_sample_rate: 24000
hop_size: 128  # matches the "hop128" suffix of vocoder_ckpt below
fft_size: 512
win_size: 512
fmin: 30
fmax: 12000  # half of audio_sample_rate
min_level_db: -120

# Dataset binarization options and data locations.
# NOTE(review): the three with_* flags are nested under binarization_args;
# confirm against the schema the binarizer expects.
binarization_args:
  with_wav: true
  with_spk_embed: false
  with_align: true
raw_data_dir: 'data/raw/popcs'
processed_data_dir: 'data/processed/popcs'
binary_data_dir: 'data/binary/popcs-pmf0'
num_spk: 1
datasets:
  - 'popcs'
# Item-name prefixes (presumably selecting held-out test items -- verify).
test_prefixes:
  - 'popcs-说散就散'
  - 'popcs-隐形的翅膀'

task_cls: tasks.tts.fs2.FastSpeech2Task

# Vocoder class and checkpoint path.
vocoder: vocoders.hifigan.HifiGAN
vocoder_ckpt: checkpoints/0109_hifigan_bigpopcs_hop128
use_nsf: true

# Training / validation settings.
max_tokens: 18000
use_spk_embed: false
num_valid_plots: 10
max_updates: 160000
save_gt: true