viks66 committed on
Commit
109bacd
·
1 Parent(s): 6d07c5e
exp/tts_stats_raw_char/train/feats_stats.npz ADDED
Binary file (1.4 kB). View file
 
exp/tts_train_transformer_raw_char/config.yaml ADDED
@@ -0,0 +1,306 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_transformer.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/tts_train_transformer_raw_char
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 3000
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - loss
39
+ - min
40
+ - - train
41
+ - loss
42
+ - min
43
+ keep_nbest_models: 5
44
+ nbest_averaging_interval: 0
45
+ grad_clip: 1.0
46
+ grad_clip_type: 2.0
47
+ grad_noise: false
48
+ accum_grad: 2
49
+ no_forward_run: false
50
+ resume: true
51
+ train_dtype: float32
52
+ use_amp: false
53
+ log_interval: null
54
+ use_matplotlib: true
55
+ use_tensorboard: true
56
+ use_wandb: false
57
+ wandb_project: null
58
+ wandb_id: null
59
+ wandb_entity: null
60
+ wandb_name: null
61
+ wandb_model_log_interval: -1
62
+ detect_anomaly: false
63
+ pretrain_path: null
64
+ init_param: []
65
+ ignore_init_mismatch: false
66
+ freeze_param: []
67
+ num_iters_per_epoch: null
68
+ batch_size: 20
69
+ valid_batch_size: null
70
+ batch_bins: 640000
71
+ valid_batch_bins: null
72
+ train_shape_file:
73
+ - exp/tts_stats_raw_char/train/text_shape.char
74
+ - exp/tts_stats_raw_char/train/speech_shape
75
+ valid_shape_file:
76
+ - exp/tts_stats_raw_char/valid/text_shape.char
77
+ - exp/tts_stats_raw_char/valid/speech_shape
78
+ batch_type: numel
79
+ valid_batch_type: null
80
+ fold_length:
81
+ - 150
82
+ - 204800
83
+ sort_in_batch: descending
84
+ sort_batch: descending
85
+ multiple_iterator: false
86
+ chunk_length: 500
87
+ chunk_shift_ratio: 0.5
88
+ num_cache_chunks: 1024
89
+ train_data_path_and_name_and_type:
90
+ - - dump/raw/train/text
91
+ - text
92
+ - text
93
+ - - dump/raw/train/wav.scp
94
+ - speech
95
+ - sound
96
+ valid_data_path_and_name_and_type:
97
+ - - dump/raw/dev/text
98
+ - text
99
+ - text
100
+ - - dump/raw/dev/wav.scp
101
+ - speech
102
+ - sound
103
+ allow_variable_data_keys: false
104
+ max_cache_size: 0.0
105
+ max_cache_fd: 32
106
+ valid_max_cache_size: null
107
+ optim: adam
108
+ optim_conf:
109
+ lr: 1.0
110
+ scheduler: noamlr
111
+ scheduler_conf:
112
+ model_size: 512
113
+ warmup_steps: 8000
114
+ token_list:
115
+ - <blank>
116
+ - <unk>
117
+ - <space>
118
+ - ा
119
+ - ्
120
+ - र
121
+ - े
122
+ - त
123
+ - य
124
+ - ी
125
+ - क
126
+ - ल
127
+ - न
128
+ - स
129
+ - ि
130
+ - व
131
+ - ं
132
+ - म
133
+ - च
134
+ - ह
135
+ - प
136
+ - ो
137
+ - ण
138
+ - द
139
+ - ज
140
+ - ु
141
+ - आ
142
+ - ग
143
+ - ट
144
+ - श
145
+ - ब
146
+ - ड
147
+ - ','
148
+ - अ
149
+ - ू
150
+ - ध
151
+ - ळ
152
+ - ष
153
+ - .
154
+ - ख
155
+ - भ
156
+ - फ
157
+ - थ
158
+ - ठ
159
+ - घ
160
+ - ॉ
161
+ - ए
162
+ - झ
163
+ - उ
164
+ - ॅ
165
+ - इ
166
+ - ई
167
+ - ढ
168
+ - ै
169
+ - ँ
170
+ - ृ
171
+ - ऊ
172
+ - ौ
173
+ - १
174
+ - ऱ
175
+ - ''''
176
+ - ओ
177
+ - ०
178
+ - २
179
+ - ऑ
180
+ - छ
181
+ - ञ
182
+ - य़
183
+ - ३
184
+ - ५
185
+ - ४
186
+ - ९
187
+ - ६
188
+ - ८
189
+ - '"'
190
+ - औ
191
+ - ७
192
+ - ऐ
193
+ - '?'
194
+ - ऍ
195
+ - ॥
196
+ - फ़
197
+ - ऋ
198
+ - ः
199
+ - ़
200
+ - ।
201
+ - '-'
202
+ - ड़
203
+ - ङ
204
+ - ऽ
205
+ - ':'
206
+ - ज़
207
+ - ॄ
208
+ - क़
209
+ - ॊ
210
+ - ‘
211
+ - ’
212
+ - ढ़
213
+ - /
214
+ - ऎ
215
+ - ॆ
216
+ - ॐ
217
+ - ग़
218
+ - '!'
219
+ - ॠ
220
+ - ऩ
221
+ - ख़
222
+ - ऒ
223
+ - o
224
+ - ऴ
225
+ - (
226
+ - )
227
+ - ;
228
+ - <sos/eos>
229
+ odim: null
230
+ model_conf: {}
231
+ use_preprocessor: true
232
+ token_type: char
233
+ bpemodel: null
234
+ non_linguistic_symbols: null
235
+ cleaner: null
236
+ g2p: null
237
+ feats_extract: fbank
238
+ feats_extract_conf:
239
+ n_fft: 1024
240
+ hop_length: 256
241
+ win_length: null
242
+ fs: 22050
243
+ fmin: 0
244
+ fmax: 8000
245
+ n_mels: 80
246
+ normalize: global_mvn
247
+ normalize_conf:
248
+ stats_file: exp/tts_stats_raw_char/train/feats_stats.npz
249
+ tts: transformer
250
+ tts_conf:
251
+ embed_dim: 0
252
+ eprenet_conv_layers: 0
253
+ eprenet_conv_filts: 0
254
+ eprenet_conv_chans: 0
255
+ dprenet_layers: 2
256
+ dprenet_units: 256
257
+ adim: 512
258
+ aheads: 8
259
+ elayers: 6
260
+ eunits: 1024
261
+ dlayers: 6
262
+ dunits: 1024
263
+ positionwise_layer_type: conv1d
264
+ positionwise_conv_kernel_size: 1
265
+ postnet_layers: 5
266
+ postnet_filts: 5
267
+ postnet_chans: 256
268
+ use_masking: true
269
+ bce_pos_weight: 5.0
270
+ use_scaled_pos_enc: true
271
+ encoder_normalize_before: true
272
+ decoder_normalize_before: true
273
+ reduction_factor: 1
274
+ init_type: xavier_uniform
275
+ init_enc_alpha: 1.0
276
+ init_dec_alpha: 1.0
277
+ eprenet_dropout_rate: 0.0
278
+ dprenet_dropout_rate: 0.5
279
+ postnet_dropout_rate: 0.5
280
+ transformer_enc_dropout_rate: 0.1
281
+ transformer_enc_positional_dropout_rate: 0.1
282
+ transformer_enc_attn_dropout_rate: 0.1
283
+ transformer_dec_dropout_rate: 0.1
284
+ transformer_dec_positional_dropout_rate: 0.1
285
+ transformer_dec_attn_dropout_rate: 0.1
286
+ transformer_enc_dec_attn_dropout_rate: 0.1
287
+ use_guided_attn_loss: true
288
+ num_heads_applied_guided_attn: 2
289
+ num_layers_applied_guided_attn: 2
290
+ modules_applied_guided_attn:
291
+ - encoder-decoder
292
+ guided_attn_loss_sigma: 0.4
293
+ guided_attn_loss_lambda: 10.0
294
+ pitch_extract: null
295
+ pitch_extract_conf: {}
296
+ pitch_normalize: null
297
+ pitch_normalize_conf: {}
298
+ energy_extract: null
299
+ energy_extract_conf: {}
300
+ energy_normalize: null
301
+ energy_normalize_conf: {}
302
+ required:
303
+ - output_dir
304
+ - token_list
305
+ version: 0.10.7a1
306
+ distributed: false
exp/tts_train_transformer_raw_char/valid.loss.ave_5best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:936c11683afdc4de0992d22d11aba1c08b6c72d72d08b0283de7befc5a63119e
3
+ size 132498531