armyshope committed on
Commit
ef552c6
·
verified ·
1 Parent(s): e787ea7

Upload 2 files

Browse files
config_musdb18_bs_mamba2.yaml ADDED
@@ -0,0 +1,82 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 132300 # 3 seconds at 44100 Hz (samplerate * 3); note this is not samplerate * training.segment, which would be 485100
3
+ hop_length: 1024
4
+ min_mean_abs: 0.0
5
+
6
+ training:
7
+ batch_size: 8
8
+ gradient_accumulation_steps: 1
9
+ grad_clip: 0
10
+ segment: 11
11
+ shift: 1
12
+ samplerate: 44100
13
+ channels: 2
14
+ normalize: true
15
+ instruments: ['drums', 'bass', 'other', 'vocals']
16
+ target_instrument: null
17
+ num_epochs: 1000
18
+ num_steps: 1000
19
+ optimizer: prodigy
20
+ lr: 1.0
21
+ patience: 2
22
+ reduce_factor: 0.95
23
+ q: 0.95
24
+ coarse_loss_clip: true
25
+ ema_momentum: 0.999
26
+ read_metadata_procs: 8
27
+ other_fix: false # needed when checking on the multisong dataset, in case 'other' is actually the instrumental
28
+ use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
29
+
30
+ model:
31
+ sr: 44100
32
+ win: 2048
33
+ stride: 512
34
+ feature_dim: 128
35
+ num_repeat_mask: 8
36
+ num_repeat_map: 4
37
+ num_output: 4
38
+
39
+ augmentations:
40
+ enable: true # enable or disable all augmentations (a quick way to turn them all off if needed)
41
+ loudness: true # randomly change the loudness of each stem within the range (loudness_min; loudness_max)
42
+ loudness_min: 0.5
43
+ loudness_max: 1.5
44
+ mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
45
+ mixup_probs:
46
+ !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
47
+ - 0.2
48
+ - 0.02
49
+ mixup_loudness_min: 0.5
50
+ mixup_loudness_max: 1.5
51
+ all:
52
+ channel_shuffle: 0.5 # Set 0 or lower to disable
53
+ random_inverse: 0.1 # inverse the track (a lower probability works better)
54
+ random_polarity: 0.5 # polarity change (multiply the waveform by -1)
55
+
56
+ loss_multistft:
57
+ fft_sizes:
58
+ - 1024
59
+ - 2048
60
+ - 4096
61
+ hop_sizes:
62
+ - 512
63
+ - 1024
64
+ - 2048
65
+ win_lengths:
66
+ - 1024
67
+ - 2048
68
+ - 4096
69
+ window: "hann_window"
70
+ scale: "mel"
71
+ n_bins: 128
72
+ sample_rate: 44100
73
+ perceptual_weighting: true
74
+ w_sc: 1.0
75
+ w_log_mag: 1.0
76
+ w_lin_mag: 0.0
77
+ w_phs: 0.0
78
+ mag_distance: "L1"
79
+
80
+ inference:
81
+ num_overlap: 2
82
+ batch_size: 8
model_bs_mamba2_ep_11_sdr_6.8723.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d85560e2495eb7852d78e07d7a00376aa69804089abc10b7eb27e41d5a3926f5
3
+ size 142774366