Politrees committed on
Commit
77f2a1d
·
verified ·
1 Parent(s): c9b303e
SCnet_models/SCNet-large_starrytong_fixed.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:65900dfa07d6b6e5d784c0f143920200a4bd281d6e78a806c549d0b912d5885e
3
- size 168852258
 
 
 
 
SCnet_models/config_musdb18_scnet.yaml DELETED
@@ -1,83 +0,0 @@
1
- audio:
2
- chunk_size: 485100 # 44100 * 11
3
- num_channels: 2
4
- sample_rate: 44100
5
- min_mean_abs: 0.000
6
-
7
- model:
8
- sources:
9
- - drums
10
- - bass
11
- - other
12
- - vocals
13
- audio_channels: 2
14
- dims:
15
- - 4
16
- - 32
17
- - 64
18
- - 128
19
- nfft: 4096
20
- hop_size: 1024
21
- win_size: 4096
22
- normalized: True
23
- band_SR:
24
- - 0.175
25
- - 0.392
26
- - 0.433
27
- band_stride:
28
- - 1
29
- - 4
30
- - 16
31
- band_kernel:
32
- - 3
33
- - 4
34
- - 16
35
- conv_depths:
36
- - 3
37
- - 2
38
- - 1
39
- compress: 4
40
- conv_kernel: 3
41
- num_dplayer: 6
42
- expand: 1
43
-
44
- training:
45
- batch_size: 10
46
- gradient_accumulation_steps: 1
47
- grad_clip: 0
48
- instruments:
49
- - Drums
50
- - Bass
51
- - Other
52
- - Vocals
53
- lr: 5.0e-04
54
- patience: 2
55
- reduce_factor: 0.95
56
- target_instrument: null
57
- num_epochs: 1000
58
- num_steps: 1000
59
- q: 0.95
60
- coarse_loss_clip: true
61
- ema_momentum: 0.999
62
- optimizer: adam
63
- other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
64
- use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
65
-
66
- augmentations:
67
- enable: true # enable or disable all augmentations (to fast disable if needed)
68
- loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
69
- loudness_min: 0.5
70
- loudness_max: 1.5
71
- mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
72
- mixup_probs:
73
- !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
74
- - 0.2
75
- - 0.02
76
- mixup_loudness_min: 0.5
77
- mixup_loudness_max: 1.5
78
-
79
- inference:
80
- batch_size: 8
81
- dim_t: 256
82
- num_overlap: 4
83
- normalize: true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
SCnet_models/config_musdb18_scnet_large.yaml DELETED
@@ -1,88 +0,0 @@
1
- audio:
2
- chunk_size: 485100 # 44100 * 11
3
- num_channels: 2
4
- sample_rate: 44100
5
- min_mean_abs: 0.000
6
-
7
- model:
8
- sources:
9
- - drums
10
- - bass
11
- - other
12
- - vocals
13
- audio_channels: 2
14
- dims:
15
- - 4
16
- - 64
17
- - 128
18
- - 256
19
- nfft: 4096
20
- hop_size: 1024
21
- win_size: 4096
22
- normalized: True
23
- band_SR:
24
- - 0.225
25
- - 0.372
26
- - 0.403
27
- band_stride:
28
- - 1
29
- - 4
30
- - 16
31
- band_kernel:
32
- - 3
33
- - 4
34
- - 16
35
- conv_depths:
36
- - 3
37
- - 2
38
- - 1
39
- compress: 4
40
- conv_kernel: 3
41
- num_dplayer: 6
42
- expand: 1
43
-
44
- training:
45
- batch_size: 6
46
- gradient_accumulation_steps: 1
47
- grad_clip: 0
48
- instruments:
49
- - Drums
50
- - Bass
51
- - Other
52
- - Vocals
53
- # lr: 1.0e-04
54
- lr: 1.0
55
- patience: 2
56
- reduce_factor: 0.95
57
- target_instrument: null
58
- num_epochs: 1000
59
- num_steps: 1000
60
- q: 0.95
61
- coarse_loss_clip: true
62
- ema_momentum: 0.999
63
- optimizer: prodigy
64
- other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
65
- use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
66
-
67
- augmentations:
68
- enable: true # enable or disable all augmentations (to fast disable if needed)
69
- loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
70
- loudness_min: 0.5
71
- loudness_max: 1.5
72
- mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
73
- mixup_probs:
74
- !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
75
- - 0.2
76
- - 0.02
77
- mixup_loudness_min: 0.5
78
- mixup_loudness_max: 1.5
79
- all:
80
- channel_shuffle: 0.5 # Set 0 or lower to disable
81
- random_inverse: 0.1 # inverse track (better lower probability)
82
- random_polarity: 0.5 # polarity change (multiply waveform to -1)
83
-
84
- inference:
85
- batch_size: 8
86
- dim_t: 256
87
- num_overlap: 4
88
- normalize: false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
SCnet_models/config_musdb18_scnet_large_starrytong.yaml DELETED
@@ -1,88 +0,0 @@
1
- audio:
2
- chunk_size: 485100 # 44100 * 11
3
- num_channels: 2
4
- sample_rate: 44100
5
- min_mean_abs: 0.000
6
-
7
- model:
8
- sources:
9
- - drums
10
- - bass
11
- - other
12
- - vocals
13
- audio_channels: 2
14
- dims:
15
- - 4
16
- - 64
17
- - 128
18
- - 256
19
- nfft: 4096
20
- hop_size: 1024
21
- win_size: 4096
22
- normalized: True
23
- band_SR:
24
- - 0.225
25
- - 0.372
26
- - 0.403
27
- band_stride:
28
- - 1
29
- - 4
30
- - 16
31
- band_kernel:
32
- - 3
33
- - 4
34
- - 16
35
- conv_depths:
36
- - 3
37
- - 2
38
- - 1
39
- compress: 4
40
- conv_kernel: 3
41
- num_dplayer: 6
42
- expand: 1
43
-
44
- training:
45
- batch_size: 6
46
- gradient_accumulation_steps: 1
47
- grad_clip: 0
48
- instruments:
49
- - Drums
50
- - Bass
51
- - Other
52
- - Vocals
53
- # lr: 1.0e-04
54
- lr: 1.0
55
- patience: 2
56
- reduce_factor: 0.95
57
- target_instrument: null
58
- num_epochs: 1000
59
- num_steps: 1000
60
- q: 0.95
61
- coarse_loss_clip: true
62
- ema_momentum: 0.999
63
- optimizer: prodigy
64
- other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
65
- use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
66
-
67
- augmentations:
68
- enable: true # enable or disable all augmentations (to fast disable if needed)
69
- loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
70
- loudness_min: 0.5
71
- loudness_max: 1.5
72
- mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
73
- mixup_probs:
74
- !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
75
- - 0.2
76
- - 0.02
77
- mixup_loudness_min: 0.5
78
- mixup_loudness_max: 1.5
79
- all:
80
- channel_shuffle: 0.5 # Set 0 or lower to disable
81
- random_inverse: 0.1 # inverse track (better lower probability)
82
- random_polarity: 0.5 # polarity change (multiply waveform to -1)
83
-
84
- inference:
85
- batch_size: 8
86
- dim_t: 256
87
- num_overlap: 4
88
- normalize: true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
SCnet_models/config_musdb18_scnet_xl.yaml DELETED
@@ -1,207 +0,0 @@
1
- audio:
2
- chunk_size: 485100 # 44100 * 11
3
- num_channels: 2
4
- sample_rate: 44100
5
- min_mean_abs: 0.000
6
-
7
- model:
8
- sources:
9
- - drums
10
- - bass
11
- - other
12
- - vocals
13
- audio_channels: 2
14
- dims:
15
- - 4
16
- - 64
17
- - 128
18
- - 256
19
- nfft: 4096
20
- hop_size: 1024
21
- win_size: 4096
22
- normalized: True
23
- band_SR:
24
- - 0.230
25
- - 0.370
26
- - 0.400
27
- band_stride:
28
- - 1
29
- - 4
30
- - 16
31
- band_kernel:
32
- - 3
33
- - 4
34
- - 16
35
- conv_depths:
36
- - 3
37
- - 2
38
- - 1
39
- compress: 4
40
- conv_kernel: 3
41
- num_dplayer: 8
42
- expand: 1
43
-
44
- training:
45
- batch_size: 4
46
- gradient_accumulation_steps: 1
47
- grad_clip: 0
48
- instruments:
49
- - Drums
50
- - Bass
51
- - Other
52
- - Vocals
53
- patience: 2
54
- reduce_factor: 0.95
55
- target_instrument: null
56
- num_epochs: 1000
57
- num_steps: 1000
58
- q: 0.95
59
- coarse_loss_clip: true
60
- ema_momentum: 0.999
61
- # optimizer: prodigy
62
- optimizer: adam
63
- lr: 1.0e-05
64
- # lr: 1.0
65
- normalize: false # perform normalization on input of model (use the same for inference!)
66
- other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
67
- use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
68
-
69
-
70
- augmentations:
71
- enable: false # enable or disable all augmentations (to fast disable if needed)
72
- loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
73
- loudness_min: 0.5
74
- loudness_max: 1.5
75
- mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
76
- mixup_probs: !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
77
- - 0.2
78
- - 0.02
79
- mixup_loudness_min: 0.5
80
- mixup_loudness_max: 1.5
81
-
82
- # apply mp3 compression to mixture only (emulate downloading mp3 from internet)
83
- mp3_compression_on_mixture: 0.01
84
- mp3_compression_on_mixture_bitrate_min: 32
85
- mp3_compression_on_mixture_bitrate_max: 320
86
- mp3_compression_on_mixture_backend: "lameenc"
87
-
88
- all:
89
- channel_shuffle: 0.5 # Set 0 or lower to disable
90
- random_inverse: 0.1 # inverse track (better lower probability)
91
- random_polarity: 0.5 # polarity change (multiply waveform to -1)
92
-
93
- mp3_compression: 0.01
94
- mp3_compression_min_bitrate: 32
95
- mp3_compression_max_bitrate: 320
96
- mp3_compression_backend: "lameenc"
97
-
98
- # pedalboard reverb block
99
- pedalboard_reverb: 0.01
100
- pedalboard_reverb_room_size_min: 0.1
101
- pedalboard_reverb_room_size_max: 0.9
102
- pedalboard_reverb_damping_min: 0.1
103
- pedalboard_reverb_damping_max: 0.9
104
- pedalboard_reverb_wet_level_min: 0.1
105
- pedalboard_reverb_wet_level_max: 0.9
106
- pedalboard_reverb_dry_level_min: 0.1
107
- pedalboard_reverb_dry_level_max: 0.9
108
- pedalboard_reverb_width_min: 0.9
109
- pedalboard_reverb_width_max: 1.0
110
-
111
- # pedalboard chorus block
112
- pedalboard_chorus: 0.01
113
- pedalboard_chorus_rate_hz_min: 1.0
114
- pedalboard_chorus_rate_hz_max: 7.0
115
- pedalboard_chorus_depth_min: 0.25
116
- pedalboard_chorus_depth_max: 0.95
117
- pedalboard_chorus_centre_delay_ms_min: 3
118
- pedalboard_chorus_centre_delay_ms_max: 10
119
- pedalboard_chorus_feedback_min: 0.0
120
- pedalboard_chorus_feedback_max: 0.5
121
- pedalboard_chorus_mix_min: 0.1
122
- pedalboard_chorus_mix_max: 0.9
123
-
124
- # pedalboard phazer block
125
- pedalboard_phazer: 0.01
126
- pedalboard_phazer_rate_hz_min: 1.0
127
- pedalboard_phazer_rate_hz_max: 10.0
128
- pedalboard_phazer_depth_min: 0.25
129
- pedalboard_phazer_depth_max: 0.95
130
- pedalboard_phazer_centre_frequency_hz_min: 200
131
- pedalboard_phazer_centre_frequency_hz_max: 12000
132
- pedalboard_phazer_feedback_min: 0.0
133
- pedalboard_phazer_feedback_max: 0.5
134
- pedalboard_phazer_mix_min: 0.1
135
- pedalboard_phazer_mix_max: 0.9
136
-
137
- # pedalboard distortion block
138
- pedalboard_distortion: 0.01
139
- pedalboard_distortion_drive_db_min: 1.0
140
- pedalboard_distortion_drive_db_max: 25.0
141
-
142
- # pedalboard pitch shift block
143
- pedalboard_pitch_shift: 0.01
144
- pedalboard_pitch_shift_semitones_min: -7
145
- pedalboard_pitch_shift_semitones_max: 7
146
-
147
- # pedalboard resample block
148
- pedalboard_resample: 0.01
149
- pedalboard_resample_target_sample_rate_min: 4000
150
- pedalboard_resample_target_sample_rate_max: 44100
151
-
152
- # pedalboard bitcrash block
153
- pedalboard_bitcrash: 0.01
154
- pedalboard_bitcrash_bit_depth_min: 4
155
- pedalboard_bitcrash_bit_depth_max: 16
156
-
157
- # pedalboard mp3 compressor block
158
- pedalboard_mp3_compressor: 0.01
159
- pedalboard_mp3_compressor_pedalboard_mp3_compressor_min: 0
160
- pedalboard_mp3_compressor_pedalboard_mp3_compressor_max: 9.999
161
-
162
- vocals:
163
- pitch_shift: 0.1
164
- pitch_shift_min_semitones: -5
165
- pitch_shift_max_semitones: 5
166
- seven_band_parametric_eq: 0.25
167
- seven_band_parametric_eq_min_gain_db: -9
168
- seven_band_parametric_eq_max_gain_db: 9
169
- tanh_distortion: 0.1
170
- tanh_distortion_min: 0.1
171
- tanh_distortion_max: 0.7
172
- bass:
173
- pitch_shift: 0.1
174
- pitch_shift_min_semitones: -2
175
- pitch_shift_max_semitones: 2
176
- seven_band_parametric_eq: 0.25
177
- seven_band_parametric_eq_min_gain_db: -3
178
- seven_band_parametric_eq_max_gain_db: 6
179
- tanh_distortion: 0.2
180
- tanh_distortion_min: 0.1
181
- tanh_distortion_max: 0.5
182
- drums:
183
- pitch_shift: 0.33
184
- pitch_shift_min_semitones: -5
185
- pitch_shift_max_semitones: 5
186
- seven_band_parametric_eq: 0.25
187
- seven_band_parametric_eq_min_gain_db: -9
188
- seven_band_parametric_eq_max_gain_db: 9
189
- tanh_distortion: 0.33
190
- tanh_distortion_min: 0.1
191
- tanh_distortion_max: 0.6
192
- other:
193
- pitch_shift: 0.1
194
- pitch_shift_min_semitones: -4
195
- pitch_shift_max_semitones: 4
196
- gaussian_noise: 0.1
197
- gaussian_noise_min_amplitude: 0.001
198
- gaussian_noise_max_amplitude: 0.015
199
- time_stretch: 0.01
200
- time_stretch_min_rate: 0.8
201
- time_stretch_max_rate: 1.25
202
-
203
- inference:
204
- batch_size: 4
205
- dim_t: 256
206
- num_overlap: 4
207
- normalize: false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
SCnet_models/model_scnet_ep_54_sdr_9.8051.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd889cc1d97619ccac59280ecc859c190cd3cc1b1557fbe3a19b1610bb67e410
3
- size 216189106
 
 
 
 
SCnet_models/model_scnet_sdr_9.3244.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe550315a76e8f4aed8475d7d5952137504a3b6c63b3adcef2443bfe73aac540
3
- size 168868194
 
 
 
 
SCnet_models/scnet_checkpoint_musdb18.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:1bc0d1abb20bfdf966dcd07637bafd03e4bc13653d09ef18bc9b3e342eafe2aa
3
- size 42434986