File size: 666 Bytes
7d4a6e1 482032d 6322eb3 7d4a6e1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 |
{
"_name_or_path": "TuKoResearch/WavCochV8192",
"architectures": ["WavCoch"],
"model_type": "WavCoch.WavCoch",
"auto_map": {
"AutoConfig": "configuration_wavcoch.WavCochConfig",
"AutoTokenizer": "modeling_wavcoch.WavCoch",
"AutoModel": "modeling_wavcoch.WavCoch"
},
"window_size": 1001,
"hop_length": 80,
"encoder_layers": 8,
"encoder_dim": 512,
"encoder_kernel_size": 3,
"decoder_layers": 8,
"decoder_dim": 512,
"decoder_kernel_size": 9,
"entropy_loss_weight": 0.001,
"commit_loss_weight": 0.001,
"diversity_gamma": 1.0,
"codebook_size": 8192,
"vocab_size": 8192,
"quantizer": "FSQ",
"channels": [8, 8, 8, 4, 4]
}