# NOTE(review): this file was recovered from a table-formatted dump in which
# every line was wrapped in `|` cell markers and all indentation and comments
# were dropped. The nesting below is reconstructed from key repetition (for
# example `num_samples` occurring once per dataset split) -- confirm against
# the upstream config. If the original started with a Hydra package directive
# comment, it was lost as well and must be restored as the first line.

# Hydra defaults list. `_self_` comes last, so the values in this file are
# merged after (and override) the configs listed before it.
defaults:
  - /solver/default
  - /model: score/basic
  - override /dset: audio/default
  - _self_

solver: diffusion

# Mandatory values: `???` must be filled in by another config or on the
# command line before the value is accessed.
sample_rate: ???
channels: ???
compression_model_checkpoint: ???
n_q: ???

# Data loading. The first three keys sit directly under `dataset`; the
# `train` / `valid` / `evaluate` / `generate` sub-sections carry their own
# values (presumably per-stage overrides of the shared ones -- confirm).
dataset:
  batch_size: 128
  num_workers: 10
  segment_duration: 1
  train:
    num_samples: 500000
  valid:
    num_samples: 10000
  evaluate:
    batch_size: 16
    num_samples: 10000
  generate:
    batch_size: 32
    num_samples: 50
    segment_duration: 10
    # NOTE(review): `audio` is placed under `generate` because it directly
    # follows that section's keys; it could belong one level up -- confirm.
    audio:
      # Interpolates the top-level `sample_rate` defined above.
      sample_rate: ${sample_rate}

loss:
  kind: mse
  norm_power: 0.

# Stage scheduling: `every` is presumably a period in epochs -- confirm.
valid:
  every: 1

evaluate:
  every: 20
  num_workers: 5
  # Per-metric on/off switches.
  metrics:
    visqol: false
    sisnr: false
    rvm: true

generate:
  every: 25
  num_workers: 5

checkpoint:
  save_last: true
  save_every: 25
  keep_last: 10
  keep_every_states: null

optim:
  epochs: 20000
  updates_per_epoch: 2000
  lr: 2e-4
  max_norm: 0
  optimizer: adam
  # Settings for the optimizer selected by `optimizer` above.
  adam:
    betas: [0.9, 0.999]
    weight_decay: 0.
  ema:
    use: true
    updates: 1
    # `device` is not defined in this file; it is expected to come from one
    # of the configs in the defaults list.
    device: ${device}
    decay: 0.99

# The three sections below are all switched off by default (`use: false`).
processor:
  name: multi_band_processor
  use: false
  n_bands: 8
  num_samples: 10_000
  power_std: 1.

resampling:
  use: false
  target_sr: 16000

filter:
  use: false
  n_bands: 4
  idx_band: 0
  cutoffs: null

# Diffusion noise schedule parameters.
schedule:
  repartition: "power"
  variable_step_batch: true
  beta_t0: 1.0e-5
  beta_t1: 2.9e-2
  beta_exp: 7.5
  num_steps: 1000
  variance: 'beta'
  clip: 5.
  rescale: 1.
  n_bands: null
  noise_scale: 1.0

metrics:
  num_stage: 4