# Top-level run settings.
version: "1.34"

# The mantissa dot matters: YAML 1.1 loaders such as PyYAML read a bare
# `1e-4` as a string, while `1.0e-4` resolves to a float everywhere.
lr: 1.0e-4
log_step: 1
split: 0
batch_size: 8
sr: 16000

# Names of the datasets in use; each one has a matching entry under `dataset`.
datasets:
  - jamendo
  - emomusic
  - pmemo
  - deam

# Model selection and its associated options.
# NOTE(review): the original indentation was lost, so this nesting is
# reconstructed. `kd`, `kd_weight`, `kd_temperature` and `lr` are placed under
# `model` because a top-level `lr` already exists and a second one would be a
# duplicate key. Confirm against the code that reads this file.
model:
  encoder: "MERT"
  layers:
    - 5
    - 6
  classifier: "linear-mt-attn-ck"

  kd: true
  kd_weight: 0.8
  kd_temperature: 1
  # The mantissa dot matters: YAML 1.1 loaders such as PyYAML read a bare
  # `1e-4` as a string, while `1.0e-4` resolves to a float everywhere.
  lr: 1.0e-4

# Per-dataset settings; the keys match the entries of `datasets`.
# Only `jamendo` carries `subset` and `split`; the other three share one shape.
dataset:
  jamendo:
    root: './dataset/jamendo'
    subset: 'moodtheme'
    batch_size: 8
    output_size: 56
    split: 0
    segment_type: "all"
    num_workers: 4
  deam:
    root: './dataset/deam'
    batch_size: 8
    output_size: 2
    segment_type: "all"
    num_workers: 4
  pmemo:
    root: './dataset/pmemo'
    batch_size: 8
    output_size: 2
    segment_type: "all"
    num_workers: 4
  emomusic:
    root: './dataset/emomusic'
    batch_size: 8
    output_size: 2
    segment_type: "all"
    num_workers: 4

# Size constants.
# NOTE(review): kept at top level because the source shows no parent key for
# them; confirm against the code that reads this file.
genre_class_size: 87
mood_class_size: 56
instr_class_size: 40
dac_latents_size: 72
dac_rvq_size: 9

# Checkpoint file paths, one key per dataset name.
checkpoint_pmemo: "tb_logs/best/P.ckpt"
checkpoint_deam: "tb_logs/best/D.ckpt"
checkpoint_emomusic: "tb_logs/best/E.ckpt"
checkpoint_jamendo: "tb_logs/best/J.ckpt"