---
# Training configuration for a Tacotron 2 run (see `model_type`) on the
# dataset named in `tacotron2_params.dataset`.
#
# Top-level keys are kept in alphabetical order, exactly as in the original
# dump. Nested mappings are written in block style so that every setting sits
# on its own line and diffs cleanly.

allow_cache: true
batch_size: 1
config: ./ttsexamples/tacotron2/conf/tacotron2.v1.yaml
dev_dir: /content/dump_ljspeech/valid
end_ratio_value: 0.0
# NOTE(review): the eval/log/save intervals in this file (50 / 20 / 20 steps)
# are very short compared with train_max_steps (200000) - confirm they are
# intended and not left over from a smoke test.
eval_interval_steps: 50
format: npy
gradient_accumulation_steps: 1
hop_size: 256
is_shuffle: true
log_interval_steps: 20
max_char_length: 128
max_mel_length: 257
mel_length_threshold: 32
mixed_precision: false
model_type: tacotron2
num_save_intermediate_results: 1

# Optimizer / learning-rate settings.
optimizer_params:
  decay_steps: 150000
  end_learning_rate: 1.0e-05
  initial_learning_rate: 0.001
  warmup_proportion: 0.02
  weight_decay: 0.001

outdir: ./ttsexamples/tacotron2/exp/train.tacotron2.v1/
# Empty strings (not null) are kept as-is for `pretrained` and `resume`.
pretrained: ''
remove_short_samples: true
resume: ''
save_interval_steps: 20
schedule_decay_steps: 50000
start_ratio_value: 0.5
# NOTE(review): this value is greater than train_max_steps (200000), so
# presumably the teacher-forcing schedule never starts during this run -
# confirm that is intended.
start_schedule_teacher_forcing: 200001

# Model hyper-parameters for the Tacotron 2 network.
tacotron2_params:
  attention_dim: 128
  attention_filters: 32
  attention_kernel: 31
  attention_type: lsa
  dataset: ljspeech
  decoder_lstm_units: 1024
  embedding_dropout_prob: 0.1
  embedding_hidden_size: 512
  encoder_conv_activation: relu
  encoder_conv_dropout_rate: 0.5
  encoder_conv_filters: 512
  encoder_conv_kernel_sizes: 5
  encoder_lstm_units: 256
  initializer_range: 0.02
  n_conv_encoder: 5
  n_conv_postnet: 5
  n_lstm_decoder: 1
  n_mels: 80
  n_prenet_layers: 2
  n_speakers: 1
  postnet_conv_filters: 512
  postnet_conv_kernel_sizes: 5
  postnet_dropout_rate: 0.1
  prenet_activation: relu
  prenet_dropout_rate: 0.5
  prenet_units: 256
  reduction_factor: 1

train_dir: /content/dump_ljspeech/train
train_max_steps: 200000
use_fal: false
use_fixed_shapes: true
use_norm: true
var_train_expr: null
verbose: 1
# Quoted so the version stays a string rather than the float 0.0.
version: '0.0'