# Experiment name; `exp_manager.name` picks it up through `${name}`.
name: predictive_conformer

# Model definition: data loaders, STFT encoder/decoder, estimator network,
# loss, validation metrics and optimizer.
#
# `???` marks a value with no default here; it has to be supplied by the user.
# `${...}` entries are interpolations that reuse another key of this file.
#
# NOTE(review): nesting was reconstructed. `encoder` living under `model` is
# confirmed by the `${model.encoder.*}` interpolations in `decoder`; the other
# sub-sections (and `sched` under `optim`) follow the same layout - confirm.
model:
  type: predictive
  sample_rate: 16000
  skip_nan_grad: false
  num_outputs: 1

  normalize_input: true

  # Training data, read through Lhotse from `shar_path`.
  train_ds:
    shar_path: ???
    use_lhotse: true
    truncate_duration: 4.09  # presumably seconds - TODO confirm
    truncate_offset_type: random
    batch_size: 64
    shuffle: true
    num_workers: 8
    pin_memory: true

  # Validation data, read from a manifest with separate input/target keys.
  validation_ds:
    manifest_filepath: ???
    input_key: noisy_filepath
    target_key: clean_filepath
    batch_size: 8
    shuffle: false
    num_workers: 4
    pin_memory: true

  # Analysis transform (audio -> spectrogram).
  encoder:
    _target_: nemo.collections.audio.modules.transforms.AudioToSpectrogram
    # fft_length // 2 + 1 = 256, which equals `estimator.feat_in` below;
    # presumably the number of subbands - TODO confirm.
    fft_length: 510
    hop_length: 128
    magnitude_power: 0.5
    scale: 0.33

  # Synthesis transform (spectrogram -> audio). Every parameter mirrors the
  # encoder through interpolation, so the two cannot drift apart.
  decoder:
    _target_: nemo.collections.audio.modules.transforms.SpectrogramToAudio
    fft_length: ${model.encoder.fft_length}
    hop_length: ${model.encoder.hop_length}
    magnitude_power: ${model.encoder.magnitude_power}
    scale: ${model.encoder.scale}

  # Network operating on the encoder output.
  estimator:
    _target_: nemo.collections.audio.parts.submodules.conformer.SpectrogramConformer
    in_channels: 1
    out_channels: 1
    feat_in: 256
    n_layers: 8
    d_model: 512
    subsampling_factor: 1
    self_attention_model: 'rel_pos'
    n_heads: 8

    # Context / causality settings.
    # NOTE(review): null context, non-causal downsampling and [-1, -1]
    # attention context look like a non-streaming setup - confirm.
    conv_context_size: null
    conv_norm_type: 'layer_norm'
    causal_downsampling: false
    att_context_size: [-1, -1]
    att_context_style: 'regular'

  loss:
    _target_: nemo.collections.audio.losses.MSELoss

  # Validation metrics.
  # NOTE(review): presumably logged as `val_sisdr`, the name monitored by the
  # checkpoint and early-stopping callbacks in `exp_manager` - confirm.
  metrics:
    val:
      sisdr:
        _target_: torchmetrics.audio.ScaleInvariantSignalDistortionRatio

  optim:
    name: adamw
    # Floats carry an explicit mantissa dot (`1.0e-3`, not `1e-3`) so that
    # YAML 1.1 loaders also resolve them as floats rather than strings.
    lr: 1.0e-3

    betas: [0.9, 0.98]
    weight_decay: 1.0e-3

    # Learning-rate schedule.
    sched:
      name: CosineAnnealing

      # Warmup is given as a ratio; the absolute step count is left unset.
      warmup_steps: null
      warmup_ratio: 0.1
      min_lr: 1.0e-5

# Trainer settings.
# NOTE(review): the keys match PyTorch Lightning `Trainer` arguments; the
# remarks below assume that is the consumer - confirm.
#
# `max_steps`, `limit_train_batches` and `val_check_interval` are `???`: no
# default is provided here, so they have to be supplied by the user.
trainer:
  devices: -1  # presumably "all available devices" - TODO confirm
  num_nodes: 1
  # With max_epochs at -1 the run is presumably bounded by max_steps alone.
  max_epochs: -1
  max_steps: ???
  limit_train_batches: ???
  val_check_interval: ???
  accelerator: auto
  strategy: ddp
  # NOTE(review): probably off because the Lhotse training loader
  # (`model.train_ds.use_lhotse: true`) does its own sharding - confirm.
  use_distributed_sampler: false
  accumulate_grad_batches: 1
  gradient_clip_val: null
  precision: 32
  log_every_n_steps: 100
  enable_progress_bar: true
  num_sanity_val_steps: 0
  check_val_every_n_epoch: null
  sync_batchnorm: true
  # Checkpointing and logging are switched off at trainer level; the
  # `exp_manager` section enables its own checkpoint callback and
  # TensorBoard logger instead.
  enable_checkpointing: false
  logger: false

# Experiment manager: output location, loggers, checkpointing, early
# stopping and resume behaviour.
exp_manager:
  exp_dir: null
  name: ${name}  # reuses the top-level `name` key

  # Logging
  create_tensorboard_logger: true

  # Checkpointing: keep the 5 checkpoints with the highest `val_sisdr`.
  create_checkpoint_callback: true
  checkpoint_callback_params:
    monitor: val_sisdr
    mode: max
    save_top_k: 5
    always_save_nemo: true

  # Early stopping on the same quantity: `val_sisdr`, higher is better,
  # patience of 20.
  create_early_stopping_callback: true
  early_stopping_callback_params:
    monitor: val_sisdr
    mode: max
    min_delta: 0.0
    patience: 20
    verbose: true
    strict: false

  # Resuming
  resume_from_checkpoint: null
  # NOTE(review): both flags are off, so an existing run is presumably not
  # picked up automatically - confirm against exp_manager's documentation.
  resume_if_exists: false
  resume_ignore_no_checkpoint: false

  # Weights & Biases logging (disabled); `name` and `project` must be filled
  # in before it is turned on - presumably required by the logger, confirm.
  create_wandb_logger: false
  wandb_logger_kwargs:
    name: null
    project: null