Politrees committed on
Commit
4cb6bf5
·
verified ·
1 Parent(s): 707f288

Delete models/Roformer/MelBand/by_Aname

Browse files
models/Roformer/MelBand/by_Aname/config_melband_roformer_vocals_test_by_aname.yaml DELETED
@@ -1,208 +0,0 @@
1
- audio:
2
- chunk_size: 661500
3
- dim_f: 1024
4
- dim_t: 1101
5
- hop_length: 441
6
- n_fft: 2048
7
- num_channels: 2
8
- sample_rate: 44100
9
- min_mean_abs: 0.001
10
-
11
- model:
12
- dim: 512
13
- depth: 8
14
- stereo: true
15
- num_stems: 1
16
- time_transformer_depth: 1
17
- freq_transformer_depth: 1
18
- num_bands: 60
19
- dim_head: 64
20
- heads: 12
21
- attn_dropout: 0
22
- ff_dropout: 0
23
- flash_attn: True
24
- dim_freqs_in: 1025
25
- sample_rate: 44100 # needed for mel filter bank from librosa
26
- stft_n_fft: 2048
27
- stft_hop_length: 441
28
- stft_win_length: 2048
29
- stft_normalized: False
30
- mask_estimator_depth: 3
31
- multi_stft_resolution_loss_weight: 1.0
32
- multi_stft_resolutions_window_sizes: !!python/tuple
33
- - 4096
34
- - 2048
35
- - 1024
36
- - 512
37
- - 256
38
- multi_stft_hop_size: 147
39
- multi_stft_normalized: False
40
-
41
- training:
42
- batch_size: 1
43
- gradient_accumulation_steps: 2
44
- grad_clip: 0
45
- instruments:
46
- - vocals
47
- - instruments
48
- lr: 1.0
49
- patience: 2
50
- reduce_factor: 0.9999999
51
- target_instrument: vocals
52
- num_epochs: 100000
53
- num_steps: 10
54
- augmentation: false # enable augmentations by audiomentations and pedalboard
55
- augmentation_type: true
56
- use_mp3_compress: false # Deprecated
57
- augmentation_mix: true # Mix several stems of the same type with some probability
58
- augmentation_loudness: true # randomly change loudness of each stem
59
- augmentation_loudness_type: 1 # Type 1 or 2
60
- augmentation_loudness_min: 0.25
61
- augmentation_loudness_max: 1
62
- q: 0.99
63
- coarse_loss_clip: false
64
- ema_momentum: 0.9995
65
- optimizer: prodigy
66
- other_fix: true # it's needed for checking on multisong dataset if other is actually instrumental
67
- use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
68
-
69
- augmentations:
70
- enable: true # enable or disable all augmentations (to fast disable if needed)
71
- loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
72
- loudness_min: 0.01
73
- loudness_max: 1.5
74
- mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
75
- mixup_probs: !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
76
- - 1
77
- - 0.1
78
- mixup_loudness_min: 0.25
79
- mixup_loudness_max: 1
80
-
81
- # apply mp3 compression to mixture only (emulate downloading mp3 from internet)
82
- mp3_compression_on_mixture: 0
83
- mp3_compression_on_mixture_bitrate_min: 32
84
- mp3_compression_on_mixture_bitrate_max: 320
85
- mp3_compression_on_mixture_backend: "lameenc"
86
-
87
- all:
88
- channel_shuffle: 0.5 # Set 0 or lower to disable
89
- random_inverse: 0.1 # inverse track (better lower probability)
90
- random_polarity: 0.5 # polarity change (multiply waveform to -1)
91
- mp3_compression: 0.01
92
- mp3_compression_min_bitrate: 32
93
- mp3_compression_max_bitrate: 320
94
- mp3_compression_backend: "lameenc"
95
-
96
- # pedalboard reverb block
97
- pedalboard_reverb: 0.7
98
- pedalboard_reverb_room_size_min: 0.4
99
- pedalboard_reverb_room_size_max: 0.9
100
- pedalboard_reverb_damping_min: 0.3
101
- pedalboard_reverb_damping_max: 0.9
102
- pedalboard_reverb_wet_level_min: 0.4
103
- pedalboard_reverb_wet_level_max: 0.9
104
- pedalboard_reverb_dry_level_min: 0.1
105
- pedalboard_reverb_dry_level_max: 0.9
106
- pedalboard_reverb_width_min: 0.9
107
- pedalboard_reverb_width_max: 1.0
108
-
109
- # pedalboard chorus block
110
- pedalboard_chorus: 0.3
111
- pedalboard_chorus_rate_hz_min: 1.0
112
- pedalboard_chorus_rate_hz_max: 7.0
113
- pedalboard_chorus_depth_min: 0.25
114
- pedalboard_chorus_depth_max: 0.95
115
- pedalboard_chorus_centre_delay_ms_min: 3
116
- pedalboard_chorus_centre_delay_ms_max: 10
117
- pedalboard_chorus_feedback_min: 0.0
118
- pedalboard_chorus_feedback_max: 0.5
119
- pedalboard_chorus_mix_min: 0.1
120
- pedalboard_chorus_mix_max: 0.9
121
-
122
- # pedalboard phazer block
123
- pedalboard_phazer: 0.2
124
- pedalboard_phazer_rate_hz_min: 1.0
125
- pedalboard_phazer_rate_hz_max: 10.0
126
- pedalboard_phazer_depth_min: 0.25
127
- pedalboard_phazer_depth_max: 0.95
128
- pedalboard_phazer_centre_frequency_hz_min: 200
129
- pedalboard_phazer_centre_frequency_hz_max: 12000
130
- pedalboard_phazer_feedback_min: 0.0
131
- pedalboard_phazer_feedback_max: 0.5
132
- pedalboard_phazer_mix_min: 0.1
133
- pedalboard_phazer_mix_max: 0.9
134
-
135
- # pedalboard distortion block
136
- pedalboard_distortion: 0.2
137
- pedalboard_distortion_drive_db_min: 1.0
138
- pedalboard_distortion_drive_db_max: 12
139
-
140
- # pedalboard pitch shift block
141
- pedalboard_pitch_shift: 0
142
- pedalboard_pitch_shift_semitones_min: -7
143
- pedalboard_pitch_shift_semitones_max: 7
144
-
145
- # pedalboard resample block
146
- pedalboard_resample: 0.3
147
- pedalboard_resample_target_sample_rate_min: 8000
148
- pedalboard_resample_target_sample_rate_max: 44100
149
-
150
- # pedalboard bitcrash block
151
- pedalboard_bitcrash: 0.1
152
- pedalboard_bitcrash_bit_depth_min: 8
153
- pedalboard_bitcrash_bit_depth_max: 16
154
-
155
- # pedalboard mp3 compressor block
156
- pedalboard_mp3_compressor: 0
157
- pedalboard_mp3_compressor_pedalboard_mp3_compressor_min: 0
158
- pedalboard_mp3_compressor_pedalboard_mp3_compressor_max: 9.999
159
-
160
- vocals:
161
- pitch_shift: 0.7
162
- pitch_shift_min_semitones: -6
163
- pitch_shift_max_semitones: 6
164
- seven_band_parametric_eq: 0.45
165
- seven_band_parametric_eq_min_gain_db: -80
166
- seven_band_parametric_eq_max_gain_db: 3
167
- tanh_distortion: 0.3
168
- tanh_distortion_min: 0.01
169
- tanh_distortion_max: 0.7
170
- other:
171
- pitch_shift: 0.5
172
- pitch_shift_min_semitones: -12
173
- pitch_shift_max_semitones: 12
174
- gaussian_noise: 0.5
175
- gaussian_noise_min_amplitude: 0.01
176
- gaussian_noise_max_amplitude: 0.5
177
- time_stretch: 0.2
178
- time_stretch_min_rate: 0.125
179
- time_stretch_max_rate: 1.0
180
-
181
- loss_multistft:
182
- fft_sizes:
183
- - 1024
184
- - 2048
185
- - 4096
186
- hop_sizes:
187
- - 512
188
- - 1024
189
- - 2048
190
- win_lengths:
191
- - 1024
192
- - 2048
193
- - 4096
194
- window: "hann_window"
195
- scale: "mel"
196
- n_bins: 128
197
- sample_rate: 44100
198
- perceptual_weighting: true
199
- w_sc: 3.0
200
- w_log_mag: 3.0
201
- w_lin_mag: 2.0
202
- w_phs: 3.0
203
- mag_distance: "L1"
204
-
205
- inference:
206
- batch_size: 4
207
- dim_t: 1101
208
- num_overlap: 4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
models/Roformer/MelBand/by_Aname/melband_roformer_kim_vocals_fullness_v1_by_aname.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d0662af510f63fe48bdc91035951c1a7ae3b41ac9ae92cf7ec88fe9d6a6cb6d
3
- size 913090472
 
 
 
 
models/Roformer/MelBand/by_Aname/melband_roformer_kim_vocals_fullness_v2_by_aname.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc4c02112d53fea925bfe362918a9cbea10b3c0893aa40506aa82874ad03138c
3
- size 913090472
 
 
 
 
models/Roformer/MelBand/by_Aname/melband_roformer_kim_vocals_v1_by_aname.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:696825ec20f6bc48add7443000def04bb1736c1098784be7cdf0756a140e9621
3
- size 913106158
 
 
 
 
models/Roformer/MelBand/by_Aname/melband_roformer_kim_vocals_v2_by_aname.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:58b1a07034e74e169e1a332c15fe63fb8da117fbeac580dbab06ad99ddb27702
3
- size 913090472
 
 
 
 
models/Roformer/MelBand/by_Aname/melband_roformer_kim_vocals_v3_by_aname.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:acf6708e4e9ead350abdeedd9f3385c5e7c08281eba24bd59c8a5fe63a446082
3
- size 913106158
 
 
 
 
models/Roformer/MelBand/by_Aname/melband_roformer_vocals_bleedness_by_aname.ckpt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:614bcc380bafe7a39ad1c451103dbe6a487886102c6b34c0561b5d8a4cec1286
3
- size 1708534246