jorisvaneyghen committed on
Commit
7804c9b
·
verified ·
1 Parent(s): 2e695f1

trained from pretrained

Browse files
Files changed (2) hide show
  1. config_jazz_scnet.yaml +83 -0
  2. model_jazz_scnet.ckpt +3 -0
config_jazz_scnet.yaml ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 485100 # 44100 * 11
3
+ num_channels: 2
4
+ sample_rate: 44100
5
+ min_mean_abs: 0.000
6
+
7
+ model:
8
+ sources:
9
+ - drums
10
+ - bass
11
+ - piano
12
+ - other
13
+ audio_channels: 2
14
+ dims:
15
+ - 4
16
+ - 32
17
+ - 64
18
+ - 128
19
+ nfft: 4096
20
+ hop_size: 1024
21
+ win_size: 4096
22
+ normalized: True
23
+ band_SR:
24
+ - 0.175
25
+ - 0.392
26
+ - 0.433
27
+ band_stride:
28
+ - 1
29
+ - 4
30
+ - 16
31
+ band_kernel:
32
+ - 3
33
+ - 4
34
+ - 16
35
+ conv_depths:
36
+ - 3
37
+ - 2
38
+ - 1
39
+ compress: 4
40
+ conv_kernel: 3
41
+ num_dplayer: 6
42
+ expand: 1
43
+
44
+ training:
45
+ batch_size: 10
46
+ gradient_accumulation_steps: 1
47
+ grad_clip: 0
48
+ instruments:
49
+ - drums
50
+ - bass
51
+ - piano
52
+ - other
53
+ lr: 5.0e-04
54
+ patience: 2
55
+ reduce_factor: 0.95
56
+ target_instrument: null
57
+ num_epochs: 1000
58
+ num_steps: 1000
59
+ q: 0.95
60
+ coarse_loss_clip: true
61
+ ema_momentum: 0.999
62
+ optimizer: adam
63
+ other_fix: false # needed when checking on the multisong dataset whether "other" is actually instrumental
64
+ use_amp: true # enable or disable mixed precision (float16) - should usually be true
65
+
66
+ augmentations:
67
+ enable: true # enable or disable all augmentations (to quickly disable them if needed)
68
+ loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
69
+ loudness_min: 0.5
70
+ loudness_max: 1.5
71
+ mixup: true # mix several stems of the same type with some probability (only works for dataset types: 1, 2, 3)
72
+ mixup_probs:
73
+ !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
74
+ - 0.2
75
+ - 0.02
76
+ mixup_loudness_min: 0.5
77
+ mixup_loudness_max: 1.5
78
+
79
+ inference:
80
+ batch_size: 4
81
+ dim_t: 256
82
+ num_overlap: 4
83
+ normalize: true
model_jazz_scnet.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d35547b4ad0061147ee712a3349acb8a73ede46d8b803dc1e2dc8715880cfc61
3
+ size 42458066