File size: 834 Bytes
18d2d5d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
{
    "feature_extractor": {
        "class_path": "vocos.feature_extractors.EncodecFeatures",
        "init_args": {
            "encodec_model": "encodec_24khz",
            "bandwidths": [
                1.5,
                3.0,
                6.0,
                12.0
            ],
            "train_codebooks": false
        }
    },
    "backbone": {
        "class_path": "vocos.models.VocosBackbone",
        "init_args": {
            "input_channels": 128,
            "dim": 384,
            "intermediate_dim": 1152,
            "num_layers": 8,
            "adanorm_num_embeddings": 4
        }
    },
    "head": {
        "class_path": "vocos.heads.ISTFTHead",
        "init_args": {
            "dim": 384,
            "n_fft": 1280,
            "hop_length": 320,
            "padding": "same"
        }
    }
}