listra92 committed on
Commit
0658047
·
verified ·
1 Parent(s): 7901725

Upload melbandroformers2Fvoc_gabox.yaml

Browse files
misc/melbandroformers2Fvoc_gabox.yaml CHANGED
@@ -1,5 +1,5 @@
1
  audio:
2
- chunk_size: 352800
3
  dim_f: 1024
4
  dim_t: 256
5
  hop_length: 441
@@ -22,7 +22,7 @@ model:
22
  ff_dropout: 0
23
  flash_attn: True
24
  dim_freqs_in: 1025
25
- sample_rate: 44100 # needed for mel filter bank from librosa
26
  stft_n_fft: 2048
27
  stft_hop_length: 441
28
  stft_win_length: 2048
@@ -39,13 +39,16 @@ model:
39
  multi_stft_normalized: False
40
 
41
  training:
 
 
 
42
  instruments:
43
- - Vocals
44
- - Instrumental
45
- target_instrument: Vocals
 
46
 
47
  inference:
48
- batch_size: 1
49
  dim_t: 1101
50
- num_overlap: 1
51
- chunk_size: 352800
 
1
  audio:
2
+ chunk_size: 661500
3
  dim_f: 1024
4
  dim_t: 256
5
  hop_length: 441
 
22
  ff_dropout: 0
23
  flash_attn: True
24
  dim_freqs_in: 1025
25
+ sample_rate: 44100
26
  stft_n_fft: 2048
27
  stft_hop_length: 441
28
  stft_win_length: 2048
 
39
  multi_stft_normalized: False
40
 
41
  training:
42
+ batch_size: 1
43
+ gradient_accumulation_steps: 1
44
+ grad_clip: 0
45
  instruments:
46
+ - vocals
47
+ - other
48
+ target_instrument: vocals
49
+ use_amp: true
50
 
51
  inference:
52
+ batch_size: 4
53
  dim_t: 1101
54
+ num_overlap: 4