File size: 965 Bytes
6f6529c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
{
	"train": {
		"log_interval": 200,
		"seed": 1234,
		"learning_rate": 0.0001,
		"betas": [0.8, 0.99],
		"eps": 1e-9,
		"lr_decay": 0.999875,
		"segment_size": 17280,
		"c_mel": 45,
		"c_kl": 1.0
	},
	"data": {
		"max_wav_value": 32768.0,
		"sample_rate": 48000,
		"filter_length": 2048,
		"hop_length": 480,
		"win_length": 2048,
		"n_mel_channels": 128,
		"mel_fmin": 0.0,
		"mel_fmax": null
	},
	"model": {
		"inter_channels": 192,
		"hidden_channels": 192,
		"filter_channels": 768,
		"text_enc_hidden_dim": 768,
		"n_heads": 2,
		"n_layers": 6,
		"kernel_size": 3,
		"p_dropout": 0,
		"resblock": "1",
		"resblock_kernel_sizes": [3, 7, 11],
		"resblock_dilation_sizes": [
			[1, 3, 5],
			[1, 3, 5],
			[1, 3, 5]
		],
		"upsample_rates": [12, 10, 2, 2],
		"upsample_initial_channel": 512,
		"upsample_kernel_sizes": [24, 20, 4, 4],
		"use_spectral_norm": false,
		"gin_channels": 256,
		"spk_embed_dim": 109
	}
}