Politrees committed on
Commit
b7d116d
·
verified ·
1 Parent(s): 045e132
MDX23C_models/MDX23C-8KFFT-InstVoc_HQ.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:49d51472769e34a2501cd1da782346a3212555c3a5619fc2c53507445528d816
3
- size 448101203
 
 
 
 
MDX23C_models/MDX23C-8KFFT-InstVoc_HQ_2.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d960d8e40a458120412c1bd807e013d2dbca7b959cc9da2bbcb0eb203d1daea
3
- size 448093770
 
 
 
 
MDX23C_models/MDX23C-De-Reverb-aufr33-jarredou.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:eae2471b707758d74db38ac1b1d5800e12f57c4e9d1ebbb2faf004b8e086e914
3
- size 448098867
 
 
 
 
MDX23C_models/MDX23C-DrumSep-aufr33-jarredou.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2a4aa53eb584d21eead358a4e66d1882ad182911be018f052b5da73be9096d0
3
- size 437652699
 
 
 
 
MDX23C_models/MDX23C_D1581.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7d4d2137f12764950205b095da20032fef1d41f077bacc8582f20ed40e8cb28
3
- size 183379219
 
 
 
 
MDX23C_models/config_dereverb_mdx23c.yaml DELETED
@@ -1,135 +0,0 @@
1
- audio:
2
- chunk_size: 261120
3
- dim_f: 4096
4
- dim_t: 256
5
- hop_length: 1024
6
- n_fft: 8192
7
- num_channels: 2
8
- sample_rate: 44100
9
- min_mean_abs: 0.001
10
-
11
- model:
12
- act: gelu
13
- bottleneck_factor: 4
14
- growth: 128
15
- norm: InstanceNorm
16
- num_blocks_per_scale: 2
17
- num_channels: 128
18
- num_scales: 5
19
- num_subbands: 4
20
- scale:
21
- - 2
22
- - 2
23
-
24
- training:
25
- batch_size: 2
26
- gradient_accumulation_steps: 1
27
- grad_clip: 0
28
- instruments:
29
- - dry
30
- - No dry
31
- lr: 1.0e-06
32
- patience: 4
33
- reduce_factor: 0.93
34
- target_instrument: null
35
- num_epochs: 40
36
- num_steps: 1000
37
- q: 0.95
38
- coarse_loss_clip: true
39
- ema_momentum: 0.999
40
- optimizer: adamw
41
- read_metadata_procs: 8 # Number of processes to use during metadata reading for dataset. Can speed up metadata generation
42
- other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
43
- use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
44
-
45
- augmentations:
46
- enable: false # enable or disable all augmentations (to quickly disable them if needed)
47
- loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
48
- loudness_min: 0.5
49
- loudness_max: 1.5
50
- mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
51
- mixup_probs: !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
52
- - 0.2
53
- - 0.02
54
- mixup_loudness_min: 0.5
55
- mixup_loudness_max: 1.5
56
-
57
- all:
58
- channel_shuffle: 0.5 # Set 0 or lower to disable
59
- random_inverse: 0.05 # inverse track (better lower probability)
60
- random_polarity: 0.5 # polarity change (multiply waveform by -1)
61
-
62
- # pedalboard chorus block
63
- pedalboard_chorus: 0.001
64
- pedalboard_chorus_rate_hz_min: 1.0
65
- pedalboard_chorus_rate_hz_max: 7.0
66
- pedalboard_chorus_depth_min: 0.25
67
- pedalboard_chorus_depth_max: 0.95
68
- pedalboard_chorus_centre_delay_ms_min: 3
69
- pedalboard_chorus_centre_delay_ms_max: 10
70
- pedalboard_chorus_feedback_min: 0.0
71
- pedalboard_chorus_feedback_max: 0.01
72
- pedalboard_chorus_mix_min: 0.1
73
- pedalboard_chorus_mix_max: 0.9
74
-
75
- # pedalboard phazer block
76
- pedalboard_phazer: 0.001
77
- pedalboard_phazer_rate_hz_min: 1.0
78
- pedalboard_phazer_rate_hz_max: 10.0
79
- pedalboard_phazer_depth_min: 0.25
80
- pedalboard_phazer_depth_max: 0.95
81
- pedalboard_phazer_centre_frequency_hz_min: 200
82
- pedalboard_phazer_centre_frequency_hz_max: 12000
83
- pedalboard_phazer_feedback_min: 0.0
84
- pedalboard_phazer_feedback_max: 0.5
85
- pedalboard_phazer_mix_min: 0.1
86
- pedalboard_phazer_mix_max: 0.9
87
-
88
- # pedalboard pitch shift block
89
- pedalboard_pitch_shift: 0.01
90
- pedalboard_pitch_shift_semitones_min: -7
91
- pedalboard_pitch_shift_semitones_max: 7
92
-
93
- # pedalboard resample block
94
- pedalboard_resample: 0.001
95
- pedalboard_resample_target_sample_rate_min: 4000
96
- pedalboard_resample_target_sample_rate_max: 44100
97
-
98
- mp3_compression_min_bitrate: 32
99
- mp3_compression_max_bitrate: 320
100
- mp3_compression_backend: "lameenc"
101
-
102
- dry:
103
- # pedalboard distortion block
104
- pedalboard_distortion: 0.001
105
- pedalboard_distortion_drive_db_min: 1.0
106
- pedalboard_distortion_drive_db_max: 25.0
107
-
108
- tanh_distortion: 0.05
109
- tanh_distortion_min: 0.1
110
- tanh_distortion_max: 0.7
111
- # pedalboard bitcrash block
112
- pedalboard_bitcrash: 0.005
113
- pedalboard_bitcrash_bit_depth_min: 4
114
- pedalboard_bitcrash_bit_depth_max: 16
115
-
116
- seven_band_parametric_eq: 0.24
117
- seven_band_parametric_eq_min_gain_db: -9
118
- seven_band_parametric_eq_max_gain_db: 9
119
-
120
- gaussian_noise: 0.005
121
- gaussian_noise_min_amplitude: 0.001
122
- gaussian_noise_max_amplitude: 0.01
123
-
124
- time_stretch: 0.01
125
- time_stretch_min_rate: 0.8
126
- time_stretch_max_rate: 1.25
127
- other:
128
- seven_band_parametric_eq: 0.24
129
- seven_band_parametric_eq_min_gain_db: -9
130
- seven_band_parametric_eq_max_gain_db: 9
131
-
132
- inference:
133
- batch_size: 2
134
- dim_t: 256
135
- num_overlap: 4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
MDX23C_models/config_drumsep_mdx23c.yaml DELETED
@@ -1,87 +0,0 @@
1
- audio:
2
- chunk_size: 130560
3
- dim_f: 1024
4
- dim_t: 256
5
- hop_length: 512
6
- n_fft: 2048
7
- num_channels: 2
8
- sample_rate: 44100
9
- min_mean_abs: 0.001
10
-
11
- model:
12
- act: gelu
13
- bottleneck_factor: 4
14
- growth: 128
15
- norm: InstanceNorm
16
- num_blocks_per_scale: 2
17
- num_channels: 128
18
- num_scales: 5
19
- num_subbands: 4
20
- scale:
21
- - 2
22
- - 2
23
-
24
- training:
25
- batch_size: 12
26
- gradient_accumulation_steps: 1
27
- grad_clip: 0
28
- instruments:
29
- - kick
30
- - snare
31
- - toms
32
- - hh
33
- - ride
34
- - crash
35
- lr: 9.0e-05
36
- patience: 30
37
- reduce_factor: 0.95
38
- target_instrument: null
39
- num_epochs: 1000
40
- num_steps: 1268
41
- q: 0.95
42
- coarse_loss_clip: true
43
- ema_momentum: 0.999
44
- optimizer: adam
45
- other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
46
- use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
47
-
48
- augmentations:
49
- enable: true # enable or disable all augmentations (to quickly disable them if needed)
50
- loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
51
- loudness_min: 0.5
52
- loudness_max: 1.5
53
- mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
54
- mixup_probs: !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
55
- - 0.2
56
- - 0.02
57
- mixup_loudness_min: 0.5
58
- mixup_loudness_max: 1.5
59
-
60
- # apply mp3 compression to mixture only (emulate downloading mp3 from internet)
61
- mp3_compression_on_mixture: 0.0
62
- mp3_compression_on_mixture_bitrate_min: 32
63
- mp3_compression_on_mixture_bitrate_max: 320
64
- mp3_compression_on_mixture_backend: "lameenc"
65
-
66
- all:
67
- channel_shuffle: 0.5 # Set 0 or lower to disable
68
- random_inverse: 0.01 # inverse track (better lower probability)
69
- random_polarity: 0.5 # polarity change (multiply waveform by -1)
70
- mp3_compression: 0.0
71
- mp3_compression_min_bitrate: 32
72
- mp3_compression_max_bitrate: 320
73
- mp3_compression_backend: "lameenc"
74
- pitch_shift: 0.1
75
- pitch_shift_min_semitones: -3
76
- pitch_shift_max_semitones: 3
77
- seven_band_parametric_eq: 0.5
78
- seven_band_parametric_eq_min_gain_db: -6
79
- seven_band_parametric_eq_max_gain_db: 6
80
- tanh_distortion: 0.2
81
- tanh_distortion_min: 0.1
82
- tanh_distortion_max: 0.5
83
-
84
- inference:
85
- batch_size: 1
86
- dim_t: 256
87
- num_overlap: 4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
MDX23C_models/config_mdx23c_similarity.yaml DELETED
@@ -1,47 +0,0 @@
1
- audio:
2
- chunk_size: 130560
3
- dim_f: 1024
4
- dim_t: 256
5
- hop_length: 512
6
- n_fft: 2048
7
- num_channels: 2
8
- sample_rate: 44100
9
- min_mean_abs: 0.001
10
-
11
- model:
12
- act: gelu
13
- bottleneck_factor: 4
14
- growth: 128
15
- norm: InstanceNorm
16
- num_blocks_per_scale: 2
17
- num_channels: 128
18
- num_scales: 5
19
- num_subbands: 4
20
- scale:
21
- - 2
22
- - 2
23
-
24
- training:
25
- batch_size: 2
26
- gradient_accumulation_steps: 3
27
- grad_clip: 0
28
- instruments:
29
- - Similarity
30
- - Difference
31
- lr: 1.0
32
- patience: 15
33
- reduce_factor: 0.95
34
- target_instrument: Similarity
35
- num_epochs: 1000
36
- num_steps: 2235
37
- q: 0.95
38
- coarse_loss_clip: true
39
- ema_momentum: 0.999
40
- optimizer: prodigy
41
- other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
42
- use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
43
-
44
- inference:
45
- batch_size: 8
46
- dim_t: 256
47
- num_overlap: 8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
MDX23C_models/model_2_stem_061321.yaml DELETED
@@ -1,36 +0,0 @@
1
- audio:
2
- chunk_size: 260096
3
- dim_f: 4096
4
- dim_t: 256
5
- hop_length: 2048
6
- n_fft: 12288
7
- num_channels: 2
8
- sample_rate: 44100
9
- min_mean_abs: 0.001
10
- model:
11
- act: gelu
12
- bottleneck_factor: 4
13
- growth: 64
14
- norm: InstanceNorm
15
- num_blocks_per_scale: 2
16
- num_channels: 128
17
- num_scales: 5
18
- num_subbands: 4
19
- scale:
20
- - 2
21
- - 2
22
- name: epoch_10.ckpt
23
- training:
24
- batch_size: 16
25
- grad_clip: 0
26
- instruments:
27
- - Vocals
28
- - Instrumental
29
- lr: 5.0e-05
30
- target_instrument: null
31
- num_epochs: 100
32
- num_steps: 1000
33
- inference:
34
- batch_size: 1
35
- dim_t: 256
36
- num_overlap: 8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
MDX23C_models/model_2_stem_full_band_8k.yaml DELETED
@@ -1,43 +0,0 @@
1
- audio:
2
- chunk_size: 261120
3
- dim_f: 4096
4
- dim_t: 256
5
- hop_length: 1024
6
- n_fft: 8192
7
- num_channels: 2
8
- sample_rate: 44100
9
- min_mean_abs: 0.001
10
- model:
11
- act: gelu
12
- bottleneck_factor: 4
13
- growth: 128
14
- norm: InstanceNorm
15
- num_blocks_per_scale: 2
16
- num_channels: 128
17
- num_scales: 5
18
- num_subbands: 4
19
- scale:
20
- - 2
21
- - 2
22
- training:
23
- batch_size: 6
24
- grad_clip: 0
25
- instruments:
26
- - Vocals
27
- - Instrumental
28
- lr: 1.0e-05
29
- patience: 2
30
- reduce_factor: 0.95
31
- target_instrument: null
32
- num_epochs: 1000
33
- num_steps: 1000
34
- augmentation: 1
35
- augmentation_type: simple1
36
- augmentation_mix: true
37
- q: 0.95
38
- coarse_loss_clip: true
39
- ema_momentum: 0.999
40
- inference:
41
- batch_size: 1
42
- dim_t: 256
43
- num_overlap: 8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
MDX23C_models/model_mdx23c_ep_271_l1_freq_72.2383.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:1227f8d97c7436004d03e46091427393abefebcc08ce53ef30082742c4e482f7
3
- size 437613512