| seed: 12345 | |
| train: true | |
| ignore_warnings: true | |
| print_config: false | |
| work_dir: ${hydra:runtime.cwd} | |
| logs_dir: ${work_dir}${oc.env:DIR_LOGS} | |
| data_dir: ${work_dir}${oc.env:DIR_DATA} | |
| ckpt_dir: ${logs_dir}/ckpts/${now:%Y-%m-%d-%H-%M-%S} | |
| module: main.module_base | |
| batch_size: 1 | |
| accumulate_grad_batches: 32 | |
| num_workers: 8 | |
| sampling_rate: 44100 | |
| length: 32768 | |
| channels: 2 | |
| log_every_n_steps: 1000 | |
| model: | |
| _target_: ${module}.Model | |
| lr: 0.0001 | |
| lr_beta1: 0.95 | |
| lr_beta2: 0.999 | |
| lr_eps: 1.0e-06 | |
| lr_weight_decay: 0.001 | |
| ema_beta: 0.995 | |
| ema_power: 0.7 | |
| model: | |
| _target_: main.DiffusionModel | |
| net_t: | |
| _target_: ${module}.UNetT | |
| in_channels: 2 | |
| channels: | |
| - 32 | |
| - 32 | |
| - 64 | |
| - 64 | |
| - 128 | |
| - 128 | |
| - 256 | |
| - 256 | |
| factors: | |
| - 1 | |
| - 2 | |
| - 2 | |
| - 2 | |
| - 2 | |
| - 2 | |
| - 2 | |
| - 2 | |
| items: | |
| - 2 | |
| - 2 | |
| - 2 | |
| - 2 | |
| - 2 | |
| - 2 | |
| - 4 | |
| - 4 | |
| attentions: | |
| - 0 | |
| - 0 | |
| - 0 | |
| - 0 | |
| - 0 | |
| - 1 | |
| - 1 | |
| - 1 | |
| attention_heads: 8 | |
| attention_features: 64 | |
| datamodule: | |
| _target_: main.module_base.Datamodule | |
| dataset: | |
| _target_: audio_data_pytorch.WAVDataset | |
| path: ./data/wav_dataset/kicks | |
| recursive: true | |
| sample_rate: ${sampling_rate} | |
| transforms: | |
| _target_: audio_data_pytorch.AllTransform | |
| crop_size: ${length} | |
| stereo: true | |
| source_rate: ${sampling_rate} | |
| target_rate: ${sampling_rate} | |
| loudness: -20 | |
| val_split: 0.05 | |
| batch_size: ${batch_size} | |
| num_workers: ${num_workers} | |
| pin_memory: true | |
| callbacks: | |
| rich_progress_bar: | |
| _target_: pytorch_lightning.callbacks.RichProgressBar | |
| model_checkpoint: | |
| _target_: pytorch_lightning.callbacks.ModelCheckpoint | |
| monitor: valid_loss | |
| save_top_k: 1 | |
| save_last: true | |
| mode: min | |
| verbose: false | |
| dirpath: ${logs_dir}/ckpts/${now:%Y-%m-%d-%H-%M-%S} | |
| filename: '{epoch:02d}-{valid_loss:.3f}' | |
| model_summary: | |
| _target_: pytorch_lightning.callbacks.RichModelSummary | |
| max_depth: 2 | |
| audio_samples_logger: | |
| _target_: main.module_base.SampleLogger | |
| num_items: 4 | |
| channels: ${channels} | |
| sampling_rate: ${sampling_rate} | |
| length: ${length} | |
| sampling_steps: | |
| - 50 | |
| use_ema_model: true | |
| loggers: | |
| wandb: | |
| _target_: pytorch_lightning.loggers.wandb.WandbLogger | |
| project: ${oc.env:WANDB_PROJECT} | |
| entity: ${oc.env:WANDB_ENTITY} | |
| name: kicks_v7 | |
| job_type: train | |
| group: '' | |
| save_dir: ${logs_dir} | |
| trainer: | |
| _target_: pytorch_lightning.Trainer | |
| gpus: 1 | |
| precision: 16 | |
| accelerator: gpu | |
| min_epochs: 0 | |
| max_epochs: -1 | |
| enable_model_summary: false | |
| log_every_n_steps: 1 | |
| check_val_every_n_epoch: null | |
| val_check_interval: ${log_every_n_steps} | |
| accumulate_grad_batches: ${accumulate_grad_batches} | |