# Solver configuration (Hydra defaults list + OmegaConf values).
#
# NOTE(review): this file was recovered from a table-wrapped, de-indented
# copy. Keys and values are unchanged; nesting was reconstructed from the key
# semantics and from the need to avoid duplicate top-level keys. Verify the
# hierarchy against the upstream config before relying on it.
# NOTE(review): the first row of the recovered copy was an empty cell where a
# header comment may have been lost. Every defaults entry below uses an
# absolute group path, so a global-package Hydra header directive is
# plausibly missing here - confirm.

# Hydra defaults list: configs composed with this one. `_self_` marks where
# this file's own values are merged relative to the other entries.
defaults:
  - /solver/default
  - /conditioner: none
  - _self_
  - /solver/musicgen/evaluation: none
  - override /dset: audio/default

autocast: true
autocast_dtype: float16

# `???` is the OmegaConf marker for a mandatory value that must be supplied
# by another config or on the command line.
solver: musicgen
sample_rate: ???
channels: ???
compression_model_checkpoint: ???
# NOTE(review): five empty rows preceded this key in the recovered copy, so an
# explanatory comment was probably lost. Presumably null means "use the
# compression model's own default" - TODO confirm.
compression_model_n_q: null

tokens:
  padding_with_special_token: false

interleave_stereo_codebooks:
  use: false
  per_timestep: false

cache:
  # Left empty on purpose; an empty value parses as null.
  path:
  write: false
  write_shard: 0
  write_num_shards: 1

# Data loading settings; train/valid/generate carry per-split sample counts.
dataset:
  batch_size: 128
  num_workers: 10
  segment_duration: 30
  min_segment_ratio: 0.8
  return_info: true
  train:
    num_samples: 1000000
  valid:
    num_samples: 10000
  generate:
    num_samples: 50

# Per-metric settings. Each metric names a `model` and has a sub-section of
# the same name holding that model's parameters.
metrics:
  fad:
    use_gt: false
    model: tf
    tf:
      bin: null
      model_path: //reference/fad/vggish_model.ckpt
  kld:
    use_gt: false
    model: passt
    passt:
      pretrained_length: 20
  text_consistency:
    use_gt: false
    model: clap
    clap:
      model_path: //reference/clap/music_audioset_epoch_15_esc_90.14.pt
      model_arch: 'HTSAT-base'
      enable_fusion: false
  chroma_cosine:
    use_gt: false
    model: chroma_base
    chroma_base:
      # Interpolated from the top-level `sample_rate` key.
      sample_rate: ${sample_rate}
      n_chroma: 12
      radix2_exp: 14
      argmax: true

generate:
  every: 25
  num_workers: 5
  path: samples
  audio:
    format: wav
    strategy: loudness
    # Interpolated from the top-level `sample_rate` key.
    sample_rate: ${sample_rate}
    loudness_headroom_db: 14
  lm:
    prompted_samples: true
    unprompted_samples: true
    gen_gt_samples: false
    prompt_duration: null
    gen_duration: null
    remove_prompts: false
    # NOTE(review): an empty row (likely a lost comment) separated the keys
    # above from the sampling parameters below; they are assumed to stay
    # under `lm` - confirm.
    use_sampling: false
    temp: 1.0
    top_k: 0
    top_p: 0.0

evaluate:
  every: 25
  num_workers: 5
  # One boolean switch per metric; the names match the sections of the
  # top-level `metrics` block, plus `base`.
  metrics:
    base: false
    fad: false
    kld: false
    text_consistency: false
    chroma_cosine: false

checkpoint:
  save_last: true
  save_every: 50
  keep_last: 10
  keep_every_states: null

optim:
  epochs: 200
  updates_per_epoch: 2000
  lr: 1e-4
  optimizer: adamw
  max_norm: 1.0
  eager_sync: true
  adam:
    betas: [0.9, 0.95]
    weight_decay: 0.1
    eps: 1e-8

schedule:
  lr_scheduler: null