| { | |
| "encoder_dim": 64, | |
| "encoder_rates": [ | |
| 2, | |
| 8, | |
| 10, | |
| 12 | |
| ], | |
| "latent_dim": 1024, | |
| "decoder_dim": 1536, | |
| "decoder_rates": [ | |
| 12, | |
| 10, | |
| 8, | |
| 2 | |
| ], | |
| "n_codebooks": 16, | |
| "codebook_size": 1024, | |
| "codebook_dim": 128, | |
| "quantizer_dropout": false, | |
| "sample_rate": 48000 | |
| } |
| { | |
| "encoder_dim": 64, | |
| "encoder_rates": [ | |
| 2, | |
| 8, | |
| 10, | |
| 12 | |
| ], | |
| "latent_dim": 1024, | |
| "decoder_dim": 1536, | |
| "decoder_rates": [ | |
| 12, | |
| 10, | |
| 8, | |
| 2 | |
| ], | |
| "n_codebooks": 16, | |
| "codebook_size": 1024, | |
| "codebook_dim": 128, | |
| "quantizer_dropout": false, | |
| "sample_rate": 48000 | |
| } |