File size: 2,066 Bytes
94ce22b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
# Settings shared by every stem: audio format, segmenting, and loader sizing.
global:
  # Sample rate in Hz.
  sr: 44100
  # Segment length in seconds.
  segment: 11.85
  # Shift in seconds.
  # NOTE(review): presumably the hop between consecutive segments - confirm.
  shift: 2
  # Sample rate in Hz. Holds the same value as `sr`; keep the two in sync.
  sample_rate: 44100
  # NOTE(review): these look like data-loader worker count and prefetch
  # depth - confirm against the code that reads them.
  n_workers: 16
  prefetch_factor: 6


# One `.pth` model file per drum stem, keyed by stem name.
# NOTE(review): the paths are relative - presumably resolved against the
# working directory of the process that loads this file; confirm.
inference_models:
  kick: 'pretrained_larsnet_models/kick/pretrained_kick_unet.pth'
  snare: 'pretrained_larsnet_models/snare/pretrained_snare_unet.pth'
  toms: 'pretrained_larsnet_models/toms/pretrained_toms_unet.pth'
  hihat: 'pretrained_larsnet_models/hihat/pretrained_hihat_unet.pth'
  cymbals: 'pretrained_larsnet_models/cymbals/pretrained_cymbals_unet.pth'


# Probabilities for the individual data augmentations.
# NOTE(review): `augmentation_prob` looks like a global gate applied before
# the per-augmentation probabilities below - confirm against the data pipeline.
data_augmentation:
  augmentation_prob: 0.5
  kit_swap_augment_prob: 0.5
  doubling_augment_prob: 0.3
  pitch_shift_augment_prob: 0.3
  saturation_augment_prob: 0.3
  channel_swap_augment_prob: 0.5
  remix_augment_prob: 0.3


# Training settings for the kick stem.
kick:
  # NOTE(review): F and T look like the spectrogram's frequency-bin and
  # time-frame counts - confirm against the model code.
  F: 2048
  T: 512
  batch_size: 24
  # Written with an explicit decimal point: YAML 1.1 loaders such as PyYAML
  # resolve a bare `1e-4` to the string '1e-4' instead of a float.
  learning_rate: 1.0e-4
  epochs: 22
  training_mode: 'stft'
  model_id: 'default_kick_unet'


# Training settings for the snare stem.
snare:
  # NOTE(review): F and T look like the spectrogram's frequency-bin and
  # time-frame counts - confirm against the model code.
  F: 2048
  T: 512
  batch_size: 24
  # Written with an explicit decimal point: YAML 1.1 loaders such as PyYAML
  # resolve a bare `1e-4` to the string '1e-4' instead of a float.
  learning_rate: 1.0e-4
  epochs: 22
  training_mode: 'stft'
  model_id: 'default_snare_unet'


# Training settings for the toms stem.
toms:
  # NOTE(review): F and T look like the spectrogram's frequency-bin and
  # time-frame counts - confirm against the model code.
  F: 2048
  T: 512
  batch_size: 24
  # Written with an explicit decimal point: YAML 1.1 loaders such as PyYAML
  # resolve a bare `1e-4` to the string '1e-4' instead of a float.
  learning_rate: 1.0e-4
  epochs: 22
  training_mode: 'stft'
  model_id: 'default_toms_unet'


# Training settings for the hihat stem.
hihat:
  # NOTE(review): F and T look like the spectrogram's frequency-bin and
  # time-frame counts - confirm against the model code.
  F: 2048
  T: 512
  batch_size: 24
  # Written with an explicit decimal point: YAML 1.1 loaders such as PyYAML
  # resolve a bare `1e-4` to the string '1e-4' instead of a float.
  learning_rate: 1.0e-4
  epochs: 22
  training_mode: 'stft'
  model_id: 'default_hihat_unet'


# Training settings for the cymbals stem.
cymbals:
  # NOTE(review): F and T look like the spectrogram's frequency-bin and
  # time-frame counts - confirm against the model code.
  F: 2048
  T: 512
  batch_size: 24
  # Written with an explicit decimal point: YAML 1.1 loaders such as PyYAML
  # resolve a bare `1e-4` to the string '1e-4' instead of a float.
  learning_rate: 1.0e-4
  epochs: 22
  training_mode: 'stft'
  model_id: 'default_cymbals_unet'