# AdamW.* - optimizer hyperparameters, written as dotted `Scope.param` keys.
# NOTE(review): presumably bound to the AdamW constructor by the config
# loader - confirm against the training entry point.
AdamW.amsgrad: false
# NOTE(review): `!!python/tuple` is a PyYAML language-specific tag. Safe
# loaders (e.g. `yaml.safe_load`) reject it, so this file can only be read by
# a loader that constructs Python tuples.
AdamW.betas: !!python/tuple
- 0.9
- 0.999
AdamW.capturable: false
AdamW.differentiable: false
# Keep the `1.0e-08` spelling (explicit `.` and signed exponent); some YAML 1.1
# resolvers read shorter forms such as `1e-8` as a string instead of a float.
AdamW.eps: 1.0e-08
AdamW.lr: 0.0001
AdamW.maximize: false
AdamW.weight_decay: 0.01
# LinearWarmupCosineDecay.* - learning-rate schedule settings.
# warmup_iters (10000) is 10% of total_iters (100000), and total_iters has the
# same value as the top-level `train_steps` key.
# NOTE(review): eta_min is presumably the floor the learning rate decays to
# (it is 10% of AdamW.lr) - confirm against the scheduler implementation.
LinearWarmupCosineDecay.eta_min: 1.0e-05
# NOTE(review): -1 looks like a "start from the beginning" sentinel - confirm.
LinearWarmupCosineDecay.last_iter: -1
LinearWarmupCosineDecay.total_iters: 100000
LinearWarmupCosineDecay.warmup_iters: 10000
# PrefixDecoderTransformerMultiOut.* - model settings, one key per parameter.
# NOTE(review): presumably constructor arguments of a class with this name;
# the class itself is not visible from this file.
PrefixDecoderTransformerMultiOut.attn_dropout: 0.1
PrefixDecoderTransformerMultiOut.cross_attend: false
PrefixDecoderTransformerMultiOut.depth: 16
PrefixDecoderTransformerMultiOut.dim: 1024
PrefixDecoderTransformerMultiOut.ff_dropout: 0.1
PrefixDecoderTransformerMultiOut.heads: 16
PrefixDecoderTransformerMultiOut.input_delay: 0
PrefixDecoderTransformerMultiOut.input_emb_dim: 128
# Same value as the top-level `max_duration`/`duration` keys is NOT implied;
# this is a sequence-length cap in whatever units the model counts positions.
PrefixDecoderTransformerMultiOut.max_seq_len: 512
# Duplicates the top-level `num_rvq_layers` key (both are 4).
# NOTE(review): presumably the two must stay in sync - confirm.
PrefixDecoderTransformerMultiOut.num_rvq_layers: 4
PrefixDecoderTransformerMultiOut.num_tokens: 1024
PrefixDecoderTransformerMultiOut.output_emb_dim: 1024
PrefixDecoderTransformerMultiOut.pad_value: 0
PrefixDecoderTransformerMultiOut.shared: false
PrefixDecoderTransformerMultiOut.use_delay_pattern: false
# Top-level (unscoped) run settings, kept in alphabetical key order.
accelerator: auto
add_inst_tokens: false
# args.* - loader/CLI bookkeeping: the config this run was loaded from, no
# save target, and no unrecognised arguments.
args.debug: 0
args.load: configs/multiout/prefix_decoder_base_cluster.yml
args.save: null
args.unknown: []
batch_size: 32
cfg_drop_prob: 0.0
checkpoint_interval: 5000
checkpoint_metric: val/loss
checkpoint_mode: min
# NOTE(review): -1 is presumably a "keep every checkpoint" sentinel - confirm.
checkpoint_top_k: -1
compile: true
# NOTE(review): absolute, user-specific cluster path; the run is not portable
# to another machine without overriding it (same for rms_base_dir, save_dir).
data_base_dir: /network/scratch/w/wu.yusong/precompute_audio_mixdown_10s
dataset_names:
- slakh2100
devices: auto
duration: 10
gradient_clip_val: 1.0
inst_tokens_as_pattern_token: true
limit_val_batches: 128
# NOTE(review): this is the quoted STRING 'false', unlike the real booleans
# used by the other flags in this file (e.g. `shuffle: false`). A non-empty
# string is truthy in Python, so a plain truthiness check would treat this as
# enabled - confirm how the consumer interprets it before changing the value.
load_audio: 'false'
load_from_latest_checkpoint: true
log_every_n_steps: 1
max_duration: 10
max_log_examples: 8
num_nodes: 1
# Duplicates PrefixDecoderTransformerMultiOut.num_rvq_layers (both are 4).
num_rvq_layers: 4
num_workers: 8
overfit_batches: 0
pattern: flatten
precision: bf16-mixed
rms_base_dir: /network/scratch/w/wu.yusong/rms_50hz
sample_interval: 10000
save_dir: /network/scratch/w/wu.yusong/online_stem_gen_logs/prefix_decoder_base
seed: 42
# NOTE(review): shuffling is off while `split` is train - confirm intentional.
shuffle: false
split: train
strategy: auto
# Same value as LinearWarmupCosineDecay.total_iters (100000).
train_steps: 100000
use_fabric: false
val_interval: 1000
wandb_project: online-stem-gen
# Single-entry weight list.
# NOTE(review): what is being weighted is not visible here; presumably one
# entry per item in `dataset_names` (which also has one entry) - confirm.
weights:
- 1