# lukewys's picture
# Upload 8 files
# db99744 verified
# Flat run configuration: every entry below is a top-level key of one mapping.
# Dotted names such as `AdamW.lr` are single literal keys, not nested mappings.
# Keys are kept in their original (alphabetical) order.

# ---- `AdamW.*` -------------------------------------------------------------
# Presumably keyword arguments bound to an AdamW optimizer — confirm against
# the code that loads this file.
AdamW.amsgrad: false
# NOTE(review): `!!python/tuple` is a PyYAML language-specific tag. Safe
# loaders (e.g. `yaml.safe_load`) reject it, so this file needs a loader that
# understands python tags.
AdamW.betas: !!python/tuple
  - 0.9
  - 0.999
AdamW.capturable: false
AdamW.differentiable: false
AdamW.eps: 1.0e-08
AdamW.lr: 0.0001
AdamW.maximize: false
AdamW.weight_decay: 0.01

# ---- `LinearWarmupCosineDecay.*` -------------------------------------------
# Presumably learning-rate schedule settings — confirm against the scheduler.
LinearWarmupCosineDecay.eta_min: 1.0e-05
LinearWarmupCosineDecay.last_iter: -1
# Same value as `train_steps` further down; presumably the two are meant to
# stay in sync — TODO confirm.
LinearWarmupCosineDecay.total_iters: 100000
LinearWarmupCosineDecay.warmup_iters: 10000

# ---- `PrefixDecoderTransformerMultiOut.*` ----------------------------------
# Presumably constructor arguments of the model class of that name — confirm.
PrefixDecoderTransformerMultiOut.attn_dropout: 0.1
PrefixDecoderTransformerMultiOut.cross_attend: false
PrefixDecoderTransformerMultiOut.depth: 16
PrefixDecoderTransformerMultiOut.dim: 1024
PrefixDecoderTransformerMultiOut.ff_dropout: 0.1
PrefixDecoderTransformerMultiOut.heads: 16
PrefixDecoderTransformerMultiOut.input_delay: 0
PrefixDecoderTransformerMultiOut.input_emb_dim: 128
PrefixDecoderTransformerMultiOut.max_seq_len: 512
# Same value as the un-prefixed `num_rvq_layers` key further down.
PrefixDecoderTransformerMultiOut.num_rvq_layers: 4
PrefixDecoderTransformerMultiOut.num_tokens: 1024
PrefixDecoderTransformerMultiOut.output_emb_dim: 1024
PrefixDecoderTransformerMultiOut.pad_value: 0
PrefixDecoderTransformerMultiOut.shared: false
PrefixDecoderTransformerMultiOut.use_delay_pattern: false

# ---- Un-prefixed keys ------------------------------------------------------
accelerator: auto
add_inst_tokens: false

# `args.*` entries: presumably bookkeeping about how the run was launched
# (`args.load` names another config file) — confirm with the CLI wrapper.
args.debug: 0
args.load: configs/multiout/prefix_decoder_base_cluster.yml
args.save: null
args.unknown: []

batch_size: 32
cfg_drop_prob: 0.0

checkpoint_interval: 5000
checkpoint_metric: val/loss
checkpoint_mode: min
checkpoint_top_k: -1

compile: true

# NOTE(review): absolute path under one user's scratch directory; it will not
# resolve on other machines. The same applies to `rms_base_dir` and `save_dir`.
data_base_dir: /network/scratch/w/wu.yusong/precompute_audio_mixdown_10s
dataset_names:
  - slakh2100
devices: auto
# Same value as `max_duration` below.
duration: 10
gradient_clip_val: 1.0
inst_tokens_as_pattern_token: true
limit_val_batches: 128
# NOTE(review): quoted, so this loads as the string 'false', not a boolean.
# A non-empty string is truthy in Python — confirm the consumer really expects
# a string here before relying on it as an on/off switch.
load_audio: 'false'
load_from_latest_checkpoint: true
log_every_n_steps: 1
max_duration: 10
max_log_examples: 8
num_nodes: 1
num_rvq_layers: 4
num_workers: 8
overfit_batches: 0
pattern: flatten
precision: bf16-mixed
rms_base_dir: /network/scratch/w/wu.yusong/rms_50hz
sample_interval: 10000
save_dir: /network/scratch/w/wu.yusong/online_stem_gen_logs/prefix_decoder_base
seed: 42
# NOTE(review): `shuffle` is false while `split` is `train` — confirm this is
# intentional.
shuffle: false
split: train
strategy: auto
train_steps: 100000
use_fabric: false
val_interval: 1000
wandb_project: online-stem-gen
# One weight and one entry in `dataset_names`; presumably paired
# element-wise — TODO confirm.
weights:
  - 1