xavriley committed on
Commit
54937fb
·
verified ·
1 Parent(s): e5d2b5b

Upload config_mdx23c_drumsep2025.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. config_mdx23c_drumsep2025.yaml +70 -0
config_mdx23c_drumsep2025.yaml ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 523776
3
+ dim_f: 1024
4
+ dim_t: 1024
5
+ hop_length: 512
6
+ n_fft: 2048
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.000
10
+
11
+ model:
12
+ act: gelu
13
+ bottleneck_factor: 4
14
+ growth: 128
15
+ norm: InstanceNorm
16
+ num_blocks_per_scale: 2
17
+ num_channels: 128
18
+ num_scales: 5
19
+ num_subbands: 4
20
+ scale:
21
+ - 2
22
+ - 2
23
+
24
+ training:
25
+ batch_size: 2
26
+ gradient_accumulation_steps: 4
27
+ grad_clip: 0
28
+ instruments:
29
+ - kick
30
+ - snare
31
+ - toms
32
+ - hh
33
+ - cymbals
34
+ lr: 1.0
35
+ patience: 200
36
+ reduce_factor: 0.95
37
+ target_instrument: null
38
+ num_epochs: 1000
39
+ num_steps: 1533
40
+ q: 0.95
41
+ coarse_loss_clip: true
42
+ ema_momentum: 0.999
43
+ optimizer: prodigy
44
+ other_fix: false # needed when checking on the multisong dataset whether "other" is actually the instrumental
45
+ use_amp: true # enable or disable mixed precision (float16); should usually be true
46
+
47
+ loss_multistft:
48
+ fft_sizes:
49
+ - 2048
50
+ hop_sizes:
51
+ - 1024
52
+ win_lengths:
53
+ - 2048
54
+ window: "hann_window"
55
+ sample_rate: 44100
56
+ perceptual_weighting: false
57
+ scale: "mel"
58
+ n_bins: 128
59
+ w_sc: 0.0
60
+ w_log_mag: 1.0
61
+ w_lin_mag: 0.0
62
+ w_phs: 0.0
63
+ mag_distance: "L1"
64
+
65
+ inference:
66
+ extension: flac
67
+ batch_size: 2
68
+ dim_t: 512
69
+ num_overlap: 4
70
+ normalize: false