---
# NOTE(review): this file appears to have been recovered from a web
# file-viewer capture (the capture reported "File size: 627 Bytes" and showed
# revisions 0ce6f0d / 27de6d7 in its gutter). Indentation was lost in the
# capture and has been reconstructed — verify against the upstream config.

# Backbone network: the class to instantiate and its constructor arguments.
backbone:
  class_path: vocos.models.VocosBackbone
  init_args:
    adanorm_num_embeddings: null
    dim: 384
    input_channels: 1024
    # 1152 is 3 x dim.
    intermediate_dim: 1152
    layer_scale_init_value: null
    num_layers: 8
# Top-level boolean switches. Their exact effect is defined by the consumer of
# this config, which is not visible from this file.
decay_mel_coeff: false
# NOTE(review): "periodicty" (sic) — presumably this must match the consumer's
# parameter spelling exactly; confirm before renaming the key.
evaluate_periodicty: true
evaluate_pesq: true
evaluate_utmos: true
# Feature extractor: only the class is named; no init_args are given here, so
# the class is presumably constructed with its defaults — confirm.
feature_extractor:
  class_path: vocos.feature_extractors.DACFeatures
# Output head: the class to instantiate and its constructor arguments.
head:
  class_path: vocos.heads.ISTFTHead
  init_args:
    # Same value as the backbone's dim (384).
    dim: 384
    hop_length: 320
    # 1280 is 4 x hop_length.
    n_fft: 1280
    padding: same
# Optimiser, loss-weight and schedule settings (flat top-level scalars).
initial_learning_rate: 0.0005
mel_loss_coeff: 45.0
mrd_loss_coeff: 1.0
num_warmup_steps: 0
pretrain_mel_steps: 0
# NOTE(review): presumably in Hz — confirm against the consumer.
sample_rate: 16000