| |
|
|
| compression_model: encodec |
|
|
| encodec: |
| autoencoder: seanet |
| quantizer: rvq |
| sample_rate: ${sample_rate} |
| channels: ${channels} |
| causal: false |
| renormalize: false |
|
|
| seanet: |
| dimension: 128 |
| channels: ${channels} |
| causal: ${encodec.causal} |
| n_filters: 32 |
| n_residual_layers: 1 |
| ratios: [8, 5, 4, 2] |
| activation: ELU |
| activation_params: {"alpha": 1.} |
| norm: weight_norm |
| norm_params: {} |
| kernel_size: 7 |
| residual_kernel_size: 3 |
| last_kernel_size: 7 |
| dilation_base: 2 |
| pad_mode: constant |
| true_skip: true |
| compress: 2 |
| lstm: 2 |
| disable_norm_outer_blocks: 0 |
| |
| |
| |
| |
| decoder: |
| trim_right_ratio: 1.0 |
| final_activation: null |
| final_activation_params: null |
| encoder: {} |
|
|
| rvq: |
| n_q: 8 |
| q_dropout: false |
| bins: 1024 |
| decay: 0.99 |
| kmeans_init: true |
| kmeans_iters: 50 |
| threshold_ema_dead_code: 2 |
| orthogonal_reg_weight: 0.0 |
| orthogonal_reg_active_codes_only: false |
|
|
| no_quant: {} |
|
|