# Flat run configuration. Dotted names such as `AdamW.lr` are literal
# top-level keys, not nested mappings. Keys are kept in their original
# (sorted) order; only layout and comments differ from the collapsed form.

# `AdamW.*` entries.
# NOTE(review): `!!python/tuple` is a Python-specific tag; safe YAML loaders
# reject it, so this file must be read with a loader that supports that tag.
AdamW.amsgrad: false
AdamW.betas: !!python/tuple [0.9, 0.999]
AdamW.capturable: false
AdamW.differentiable: false
AdamW.eps: 1.0e-08
AdamW.lr: 0.0001
AdamW.maximize: false
AdamW.weight_decay: 0.01

# `LinearWarmupCosineDecay.*` entries.
# `total_iters` has the same value as `train_steps` further down (100000).
LinearWarmupCosineDecay.eta_min: 1.0e-05
LinearWarmupCosineDecay.last_iter: -1
LinearWarmupCosineDecay.total_iters: 100000
LinearWarmupCosineDecay.warmup_iters: 10000

# `PrefixDecoderTransformerMultiOut.*` entries.
# `num_rvq_layers` here has the same value as the top-level `num_rvq_layers`.
PrefixDecoderTransformerMultiOut.attn_dropout: 0.1
PrefixDecoderTransformerMultiOut.cross_attend: false
PrefixDecoderTransformerMultiOut.depth: 16
PrefixDecoderTransformerMultiOut.dim: 1024
PrefixDecoderTransformerMultiOut.ff_dropout: 0.1
PrefixDecoderTransformerMultiOut.heads: 16
PrefixDecoderTransformerMultiOut.input_delay: 0
PrefixDecoderTransformerMultiOut.input_emb_dim: 128
PrefixDecoderTransformerMultiOut.max_seq_len: 512
PrefixDecoderTransformerMultiOut.num_rvq_layers: 4
PrefixDecoderTransformerMultiOut.num_tokens: 1024
PrefixDecoderTransformerMultiOut.output_emb_dim: 1024
PrefixDecoderTransformerMultiOut.pad_value: 0
PrefixDecoderTransformerMultiOut.shared: false
PrefixDecoderTransformerMultiOut.use_delay_pattern: false

# General run entries (un-prefixed keys and `args.*`).
accelerator: auto
add_inst_tokens: false
args.debug: 0
args.load: configs/multiout/prefix_decoder_base_cluster.yml
args.save: null
args.unknown: []
batch_size: 32
cfg_drop_prob: 0.0
checkpoint_interval: 5000
checkpoint_metric: val/loss
checkpoint_mode: min
checkpoint_top_k: -1
compile: true
data_base_dir: /network/scratch/w/wu.yusong/precompute_audio_mixdown_10s
dataset_names: [slakh2100]
devices: auto
duration: 10
gradient_clip_val: 1.0
inst_tokens_as_pattern_token: true
limit_val_batches: 128
# NOTE(review): quoted, so this loads as the string 'false', not a boolean
# (unlike the other flags in this file) - confirm the consumer expects a string.
load_audio: 'false'
load_from_latest_checkpoint: true
log_every_n_steps: 1
max_duration: 10
max_log_examples: 8
num_nodes: 1
num_rvq_layers: 4
num_workers: 8
overfit_batches: 0
pattern: flatten
precision: bf16-mixed
rms_base_dir: /network/scratch/w/wu.yusong/rms_50hz
sample_interval: 10000
save_dir: /network/scratch/w/wu.yusong/online_stem_gen_logs/prefix_decoder_base
seed: 42
shuffle: false
split: train
strategy: auto
train_steps: 100000
use_fabric: false
val_interval: 1000
wandb_project: online-stem-gen
weights: [1]