shethjenil commited on
Commit
0013177
·
verified ·
1 Parent(s): 7a459a0

Upload folder using huggingface_hub

Browse files
Files changed (41) hide show
  1. .gitattributes +10 -0
  2. omnizart/beat/beat_blstm/configurations.yaml +58 -0
  3. omnizart/beat/beat_blstm/saved_model.pb +3 -0
  4. omnizart/beat/beat_blstm/variables/variables.data-00000-of-00001 +3 -0
  5. omnizart/beat/beat_blstm/variables/variables.index +0 -0
  6. omnizart/chord/chord_v1/configurations.yaml +119 -0
  7. omnizart/chord/chord_v1/saved_model.pb +3 -0
  8. omnizart/chord/chord_v1/variables/variables.data-00000-of-00001 +3 -0
  9. omnizart/chord/chord_v1/variables/variables.index +0 -0
  10. omnizart/drum/drum_keras/configurations.yaml +115 -0
  11. omnizart/drum/drum_keras/saved_model.pb +3 -0
  12. omnizart/drum/drum_keras/variables/variables.data-00000-of-00001 +3 -0
  13. omnizart/drum/drum_keras/variables/variables.index +0 -0
  14. omnizart/music/music_note_stream/configurations.yaml +86 -0
  15. omnizart/music/music_note_stream/saved_model.pb +3 -0
  16. omnizart/music/music_note_stream/variables/variables.data-00000-of-00001 +3 -0
  17. omnizart/music/music_note_stream/variables/variables.index +0 -0
  18. omnizart/music/music_piano-v2/configurations.yaml +88 -0
  19. omnizart/music/music_piano-v2/saved_model.pb +3 -0
  20. omnizart/music/music_piano-v2/variables/variables.data-00000-of-00001 +3 -0
  21. omnizart/music/music_piano-v2/variables/variables.index +0 -0
  22. omnizart/music/music_piano/configurations.yaml +166 -0
  23. omnizart/music/music_piano/saved_model.pb +3 -0
  24. omnizart/music/music_piano/variables/variables.data-00000-of-00001 +3 -0
  25. omnizart/music/music_piano/variables/variables.index +0 -0
  26. omnizart/music/music_pop/configurations.yaml +88 -0
  27. omnizart/music/music_pop/saved_model.pb +3 -0
  28. omnizart/music/music_pop/variables/variables.data-00000-of-00001 +3 -0
  29. omnizart/music/music_pop/variables/variables.index +0 -0
  30. omnizart/patch_cnn/patch_cnn_melody/configurations.yaml +118 -0
  31. omnizart/patch_cnn/patch_cnn_melody/saved_model.pb +3 -0
  32. omnizart/patch_cnn/patch_cnn_melody/variables/variables.data-00000-of-00001 +3 -0
  33. omnizart/patch_cnn/patch_cnn_melody/variables/variables.index +0 -0
  34. omnizart/vocal/vocal_contour/configurations.yaml +42 -0
  35. omnizart/vocal/vocal_contour/saved_model.pb +3 -0
  36. omnizart/vocal/vocal_contour/variables/variables.data-00000-of-00001 +3 -0
  37. omnizart/vocal/vocal_contour/variables/variables.index +0 -0
  38. omnizart/vocal/vocal_semi/configurations.yaml +150 -0
  39. omnizart/vocal/vocal_semi/saved_model.pb +3 -0
  40. omnizart/vocal/vocal_semi/variables/variables.data-00000-of-00001 +3 -0
  41. omnizart/vocal/vocal_semi/variables/variables.index +0 -0
.gitattributes CHANGED
@@ -35,3 +35,13 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  basicpitch/nmp/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
37
  basicpitch/nmp_vamp_plugin/ircambasicpitch.so filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  basicpitch/nmp/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
37
  basicpitch/nmp_vamp_plugin/ircambasicpitch.so filter=lfs diff=lfs merge=lfs -text
38
+ omnizart/beat/beat_blstm/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
39
+ omnizart/chord/chord_v1/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
40
+ omnizart/drum/drum_keras/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
41
+ omnizart/music/music_note_stream/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
42
+ omnizart/music/music_piano/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
43
+ omnizart/music/music_piano-v2/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
44
+ omnizart/music/music_pop/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
45
+ omnizart/patch_cnn/patch_cnn_melody/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
46
+ omnizart/vocal/vocal_contour/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
47
+ omnizart/vocal/vocal_semi/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
omnizart/beat/beat_blstm/configurations.yaml ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ General:
2
+ CheckpointPath:
3
+ Value:
4
+ BLSTM: checkpoints/beat/beat_blstm
5
+ Dataset:
6
+ Settings:
7
+ FeatureSavePath:
8
+ Value: +
9
+ SavePath:
10
+ Value: ./
11
+ Feature:
12
+ Settings:
13
+ TimeUnit:
14
+ Value: 0.01
15
+ Inference:
16
+ Settings:
17
+ BeatThreshold:
18
+ Value: 0.5
19
+ DownBeatThreshold:
20
+ Value: 0.3
21
+ MinDistance:
22
+ Value: 0.3
23
+ Model:
24
+ Settings:
25
+ AttnHiddenDim:
26
+ Value: 256
27
+ LstmHiddenDim:
28
+ Value: 25
29
+ ModelType:
30
+ Value: blstm
31
+ NumLstmLayers:
32
+ Value: 2
33
+ SavePath:
34
+ Value: ./checkpoints/beat
35
+ SavePrefix:
36
+ Value: beat
37
+ Timesteps:
38
+ Value: 1000
39
+ Training:
40
+ Settings:
41
+ BatchSize:
42
+ Value: 64
43
+ DownBeatWeight:
44
+ Value: 5
45
+ EarlyStop:
46
+ Value: 4
47
+ Epoch:
48
+ Value: 10
49
+ InitLearningRate:
50
+ Value: 0.001
51
+ Steps:
52
+ Value: 2000
53
+ ValBatchSize:
54
+ Value: 64
55
+ ValSteps:
56
+ Value: 200
57
+ TranscriptionMode:
58
+ Value: BLSTM
omnizart/beat/beat_blstm/saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a0bff208bd559b49df510f2e5177e28b755a29ae36ac690377e00529971417b
3
+ size 5077079
omnizart/beat/beat_blstm/variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:673692c2d4cff145bcaad5396d61e480aa442c86f1ac928be2da18568a306057
3
+ size 400241555
omnizart/beat/beat_blstm/variables/variables.index ADDED
Binary file (1.23 kB). View file
 
omnizart/chord/chord_v1/configurations.yaml ADDED
@@ -0,0 +1,119 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ General:
3
+ TranscriptionMode:
4
+ Description: Mode of transcription by executing the `omnizart_fix chord transcribe` command.
5
+ Type: String
6
+ Value: ChordV1
7
+ CheckpointPath:
8
+ Description: Path to the pre-trained models.
9
+ Type: Map
10
+ SubType: [String, String]
11
+ Value:
12
+ ChordV1: checkpoints/chord/chord_v1
13
+ Feature:
14
+ Description: Default settings of feature extraction for chord transcription.
15
+ Settings:
16
+ SegmentWidth:
17
+ Description: Width of segments. Each frame lasts for 0.046 seconds, and thus each segment would last for around 0.5 seconds.
18
+ Type: Integer
19
+ Value: 21
20
+ SegmentHop:
21
+ Description: Hop size of the segment.
22
+ Type: Integer
23
+ Value: 5
24
+ NumSteps:
25
+ Description: Number of total steps. Default setting would have around 23 seconds.
26
+ Type: Integer
27
+ Value: 100
28
+ Dataset:
29
+ Description: Settings of datasets.
30
+ Settings:
31
+ SavePath:
32
+ Description: Path for storing the downloaded datasets.
33
+ Type: String
34
+ Value: ./
35
+ FeatureSavePath:
36
+ Description: Path for storing the extracted feature. Default to the path under the dataset folder.
37
+ Type: String
38
+ Value: +
39
+ Model:
40
+ Description: Default settings of training / testing the model.
41
+ Settings:
42
+ SavePrefix:
43
+ Description: Prefix of the trained model's name to be saved.
44
+ Type: String
45
+ Value: chord
46
+ SavePath:
47
+ Description: Path to save the trained model.
48
+ Type: String
49
+ Value: ./checkpoints/chord
50
+ NumEncAttnBlocks:
51
+ Description: Number of attention blocks for encoder.
52
+ Type: Integer
53
+ Value: 2
54
+ NumDecAttnBlocks:
55
+ Description: Number of attention blocks for decoder.
56
+ Type: Integer
57
+ Value: 2
58
+ FreqSize:
59
+ Description: Available size on the frequency axis to be seen.
60
+ Type: Integer
61
+ Value: 24
62
+ EncInputEmbSize:
63
+ Description: Embedding size of the encoder's input.
64
+ Type: Integer
65
+ Value: 512
66
+ DecInputEmbSize:
67
+ Description: Embedding size of the decoder's input.
68
+ Type: Integer
69
+ Value: 512
70
+ DropoutRate:
71
+ Description: Dropout rate of all dropout layers.
72
+ Type: Float
73
+ Value: 0.6
74
+ AnnealingRate:
75
+ Description: To be added...
76
+ Type: Float
77
+ Value: 1.1
78
+ Inference:
79
+ Description: Default settings when inferring notes.
80
+ Settings:
81
+ MinDura:
82
+ Description: Minimum duration (in seconds) for each chord. If shorter than expected, will append the duration to the previous chord.
83
+ Type: Float
84
+ Value: 0.1
85
+ Training:
86
+ Description: Hyper parameters for training
87
+ Settings:
88
+ Epoch:
89
+ Description: Maximum number of epochs for training.
90
+ Type: Integer
91
+ Value: 10
92
+ Steps:
93
+ Description: Number of training steps for each epoch.
94
+ Type: Integer
95
+ Value: 1000
96
+ ValSteps:
97
+ Description: Number of validation steps after each training epoch.
98
+ Type: Integer
99
+ Value: 500
100
+ BatchSize:
101
+ Description: Batch size of each training step.
102
+ Type: Integer
103
+ Value: 32
104
+ ValBatchSize:
105
+ Description: Batch size of each validation step.
106
+ Type: Integer
107
+ Value: 32
108
+ EarlyStop:
109
+ Description: Terminate the training if the validation performance doesn't improve after n epochs.
110
+ Type: Integer
111
+ Value: 4
112
+ InitLearningRate:
113
+ Descriptoin: Initial learning rate.
114
+ Type: Float
115
+ Value: 0.0001
116
+ LearningRateDecay:
117
+ Description: Decaying rate of learning rate per epoch.
118
+ Type: Float
119
+ Value: 0.96
omnizart/chord/chord_v1/saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:489a3db29d528d67d1b7743a0301a4ab81f0803bfcbb0e819615eb64ec67203b
3
+ size 23098326
omnizart/chord/chord_v1/variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba35defa2a043c3cf9d3ef9512a83a6fe6bb62cd247026de50f58bdc0e71317d
3
+ size 44242072
omnizart/chord/chord_v1/variables/variables.index ADDED
Binary file (7.13 kB). View file
 
omnizart/drum/drum_keras/configurations.yaml ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ General:
3
+ TranscriptionMode:
4
+ Description: Mode of transcription by executing the `omnizart_fix drum transcribe` command.
5
+ Type: String
6
+ Value: keras
7
+ CheckpointPath:
8
+ Description: Path to the pre-trained models.
9
+ Type: Map
10
+ SubType: [String, String]
11
+ Value:
12
+ keras: ./checkpoints/drum/drum_keras
13
+ Feature:
14
+ Description: Default settings of feature extraction for drum transcription.
15
+ Settings:
16
+ SamplingRate:
17
+ Description: Adjust input sampling rate to this value.
18
+ Type: Integer
19
+ Value: 44100
20
+ PaddingSeconds:
21
+ Description: Padding length to the begin and the end of the raw audio data.
22
+ Type: Float
23
+ Value: 1.0
24
+ LowestNote:
25
+ Description: Lowest MIDI note number to be considered.
26
+ Type: Integer
27
+ Value: 16
28
+ NumberOfNotes:
29
+ Description: Number of total notes to extract.
30
+ Type: Integer
31
+ Value: 120
32
+ HopSize:
33
+ Description: Hop size for computing CQT feature.
34
+ Type: Integer
35
+ Value: 256
36
+ MiniBeatPerBar:
37
+ Description: Number of mini beats in a single 4/4 measure.
38
+ Type: Integer
39
+ Value: 32
40
+ MiniBeatPerSegment:
41
+ Description: Number of mini beats in a single segment.
42
+ Type: Integer
43
+ Value: 4
44
+ Dataset:
45
+ Description: Settings of datasets.
46
+ Settings:
47
+ SavePath:
48
+ Description: Path for storing the downloaded datasets.
49
+ Type: String
50
+ Value: ./
51
+ FeatureSavePath:
52
+ Description: Path for storing the extracted feature. Default to the path under the dataset folder.
53
+ Type: String
54
+ Value: +
55
+ Model:
56
+ Description: Default settings of training / testing the model.
57
+ Settings:
58
+ SavePrefix:
59
+ Description: Prefix of the trained model's name to be saved.
60
+ Type: String
61
+ Value: drum
62
+ SavePath:
63
+ Description: Path to save the trained model.
64
+ Type: String
65
+ Value: ./checkpoints/drum
66
+ Inference:
67
+ Description: Default settings when inferring notes.
68
+ Settings:
69
+ BassDrumTh:
70
+ Description: Threshold for the bass drum.
71
+ Type: Float
72
+ Value: 0.85
73
+ SnareTh:
74
+ Description: Threshold for the snare.
75
+ Type: Float
76
+ Value: 1.2
77
+ HihatTh:
78
+ Description: Threshold for the hihat.
79
+ Type: Float
80
+ Value: 0.17
81
+ Training:
82
+ Description: Hyper parameters for training
83
+ Settings:
84
+ Epoch:
85
+ Description: Maximum number of epochs for training.
86
+ Type: Integer
87
+ Value: 50
88
+ Steps:
89
+ Description: Number of training steps for each epoch.
90
+ Type: Integer
91
+ Value: 1000
92
+ ValSteps:
93
+ Description: Number of validation steps after each training epoch.
94
+ Type: Integer
95
+ Value: 100
96
+ BatchSize:
97
+ Description: Batch size of each training step.
98
+ Type: Integer
99
+ Value: 32
100
+ ValBatchSize:
101
+ Description: Batch size of each validation step.
102
+ Type: Integer
103
+ Value: 32
104
+ EarlyStop:
105
+ Description: Terminate the training if the validation performance doesn't improve after n epochs.
106
+ Type: Integer
107
+ Value: 6
108
+ InitLearningRate:
109
+ Descriptoin: Initial learning rate.
110
+ Type: Float
111
+ Value: 0.00002
112
+ ResBlockNum:
113
+ Description: Number of residual blocks.
114
+ Type: Integer
115
+ Value: 3
omnizart/drum/drum_keras/saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6536f2fd67472cf8fcaea89888410eb6c09b4e3ac72664cb9fffe7441aa6559b
3
+ size 1829175
omnizart/drum/drum_keras/variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e5105215ec8bdee5ebba57c2eef8655a310de99da9f3169b3f857e2185ab464
3
+ size 31090686
omnizart/drum/drum_keras/variables/variables.index ADDED
Binary file (5.02 kB). View file
 
omnizart/music/music_note_stream/configurations.yaml ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ General:
2
+ CheckpointPath:
3
+ Value:
4
+ Piano: ./checkpoints/music/music_piano
5
+ Pop: ./checkpoints/music/music_pop
6
+ Dataset:
7
+ Settings:
8
+ FeatureSavePath:
9
+ Value: +
10
+ FeatureType:
11
+ Value: CFP
12
+ SavePath:
13
+ Value: ./
14
+ Feature:
15
+ Settings:
16
+ BinsPerOctave:
17
+ Value: 48
18
+ FrequencyCenter:
19
+ Value: 27.5
20
+ FrequencyResolution:
21
+ Value: 2.0
22
+ Gamma:
23
+ Value:
24
+ - 0.24
25
+ - 0.6
26
+ - 1.0
27
+ Harmonic:
28
+ Value: false
29
+ HarmonicNumber:
30
+ Value: 6
31
+ HopSize:
32
+ Value: 0.02
33
+ SamplingRate:
34
+ Value: 44100
35
+ TimeCenter:
36
+ Value: 0.00022287
37
+ WindowSize:
38
+ Value: 7939
39
+ Inference:
40
+ Settings:
41
+ DuraTh:
42
+ Value: 0.5
43
+ FrameTh:
44
+ Value: 0.5
45
+ InstTh:
46
+ Value: 1.1
47
+ MinLength:
48
+ Value: 0.05
49
+ OnsetTh:
50
+ Value: 6.0
51
+ Model:
52
+ Settings:
53
+ ModelType:
54
+ Value: attn
55
+ SavePath:
56
+ Value: ./checkpoints/music
57
+ SavePrefix:
58
+ Value: music
59
+ Training:
60
+ Settings:
61
+ BatchSize:
62
+ Value: 8
63
+ Channels:
64
+ Value:
65
+ - Spec
66
+ - Ceps
67
+ EarlyStop:
68
+ Value: 6
69
+ Epoch:
70
+ Value: 20
71
+ LabelType:
72
+ Value: note-stream
73
+ LossFunction:
74
+ Value: smooth
75
+ Steps:
76
+ Value: 3000
77
+ Timesteps:
78
+ Value: 128
79
+ ValBatchSize:
80
+ Value: 8
81
+ ValSteps:
82
+ Value: 500
83
+ FeatureNum:
84
+ Value: 352
85
+ TranscriptionMode:
86
+ Value: Stream
omnizart/music/music_note_stream/saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b629d1fe06db9bb056d74857376616cdec7d67884bec4ba08aa48235989e7ea1
3
+ size 4448469
omnizart/music/music_note_stream/variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3f1dce36c255b2e34d69e1faba1e0822723240880b5fdd444613fdb2f29eb15
3
+ size 33495027
omnizart/music/music_note_stream/variables/variables.index ADDED
Binary file (18.4 kB). View file
 
omnizart/music/music_piano-v2/configurations.yaml ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ General:
2
+ CheckpointPath:
3
+ Value:
4
+ Piano: checkpoints/music/music_piano
5
+ Pop: checkpoints/music/music_pop
6
+ Stream: checkpoints/music/music_note_stream
7
+ Dataset:
8
+ Settings:
9
+ FeatureSavePath:
10
+ Value: +
11
+ FeatureType:
12
+ Value: CFP
13
+ SavePath:
14
+ Value: ./
15
+ Feature:
16
+ Settings:
17
+ BinsPerOctave:
18
+ Value: 48
19
+ FrequencyCenter:
20
+ Value: 27.5
21
+ FrequencyResolution:
22
+ Value: 2.0
23
+ Gamma:
24
+ Value:
25
+ - 0.24
26
+ - 0.6
27
+ - 1.0
28
+ Harmonic:
29
+ Value: false
30
+ HarmonicNumber:
31
+ Value: 6
32
+ HopSize:
33
+ Value: 0.02
34
+ SamplingRate:
35
+ Value: 44100
36
+ TimeCenter:
37
+ Value: 0.00022287
38
+ WindowSize:
39
+ Value: 7939
40
+ Inference:
41
+ Settings:
42
+ DuraTh:
43
+ Value: 0.5
44
+ FrameTh:
45
+ Value: 0.5
46
+ InstTh:
47
+ Value: 1.1
48
+ MinLength:
49
+ Value: 0.05
50
+ OnsetTh:
51
+ Value: 4
52
+ Model:
53
+ Settings:
54
+ ModelType:
55
+ Value: aspp
56
+ SavePath:
57
+ Value: ./checkpoints/music
58
+ SavePrefix:
59
+ Value: music
60
+ Training:
61
+ Settings:
62
+ BatchSize:
63
+ Value: 16
64
+ Channels:
65
+ Value:
66
+ - Spec
67
+ - Ceps
68
+ - GCoS
69
+ EarlyStop:
70
+ Value: 6
71
+ Epoch:
72
+ Value: 30
73
+ FeatureNum:
74
+ Value: 352
75
+ LabelType:
76
+ Value: note
77
+ LossFunction:
78
+ Value: smooth
79
+ Steps:
80
+ Value: 1500
81
+ Timesteps:
82
+ Value: 256
83
+ ValBatchSize:
84
+ Value: 8
85
+ ValSteps:
86
+ Value: 150
87
+ TranscriptionMode:
88
+ Value: Piano
omnizart/music/music_piano-v2/saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2244e3929e88ae32ad32ad46541eab7ce6803d34c6c37cb9445b50ffc89e9281
3
+ size 4402822
omnizart/music/music_piano-v2/variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3316d5fed8054bb7f6aa18021d6787484808894a1eceacea0f9a9f2fe1fb684
3
+ size 84656908
omnizart/music/music_piano-v2/variables/variables.index ADDED
Binary file (21.1 kB). View file
 
omnizart/music/music_piano/configurations.yaml ADDED
@@ -0,0 +1,166 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Self-documented configurable settings, with description, type hint, and available
2
+ # options. All the parameters can be overridden by another specified configuration file
3
+ # with selected parameters.
4
+
5
+
6
+ General:
7
+ TranscriptionMode:
8
+ Description: Mode of transcription by executing the `omnizart_fix music transcribe` command.
9
+ Type: String
10
+ Value: Piano
11
+ CheckpointPath:
12
+ Description: Path to the pre-trained models.
13
+ Type: Map
14
+ SubType: [String, String]
15
+ Value:
16
+ Piano: ./checkpoints/music/music_piano
17
+ Pop: ./checkpoints/music/music_pop
18
+ Stream: ./checkpoints/music/music_note_stream
19
+ Feature:
20
+ Description: Default settings of feature extraction
21
+ Settings:
22
+ HopSize:
23
+ Description: Hop size in seconds with respect to sampling rate.
24
+ Type: Float
25
+ Value: 0.02
26
+ SamplingRate:
27
+ Description: Adjust input sampling rate to this value.
28
+ Type: Integer
29
+ Value: 44100
30
+ WindowSize:
31
+ Type: Integer
32
+ Value: 7939
33
+ FrequencyResolution:
34
+ Type: Float
35
+ Value: 2.0
36
+ FrequencyCenter:
37
+ Description: Lowest frequency to extract.
38
+ Type: Float
39
+ Value: 27.5
40
+ TimeCenter:
41
+ Description: Highest frequency to extract (1/time_center).
42
+ Type: Float
43
+ Value: 0.00022287
44
+ Gamma:
45
+ Type: List
46
+ SubType: Float
47
+ Value: [0.24, 0.6, 1.0]
48
+ BinsPerOctave:
49
+ Description: Number of bins for each octave.
50
+ Type: Integer
51
+ Value: 48
52
+ HarmonicNumber:
53
+ Description: Number of harmonic bins of HCFP feature.
54
+ Type: Integer
55
+ Value: 6
56
+ Harmonic:
57
+ Description: Whether to use harmonic version of the input feature for training.
58
+ Type: Bool
59
+ Value: False
60
+ Dataset:
61
+ Description: Settings of datasets.
62
+ Settings:
63
+ SavePath:
64
+ Description: Path for storing the downloaded datasets.
65
+ Type: String
66
+ Value: ./
67
+ FeatureType:
68
+ Description: Type of feature to extract.
69
+ Type: String
70
+ Value: CFP
71
+ Choices: ["CFP", "HCFP"]
72
+ FeatureSavePath:
73
+ Description: Path for storing the extracted feature. Default to the path under the dataset folder.
74
+ Type: String
75
+ Value: +
76
+ Model:
77
+ Description: Default settings of training / testing the model.
78
+ Settings:
79
+ SavePrefix:
80
+ Description: Prefix of the trained model's name to be saved.
81
+ Type: String
82
+ Value: music
83
+ SavePath:
84
+ Description: Path to save the trained model.
85
+ Type: String
86
+ Value: ./checkpoints/music
87
+ ModelType:
88
+ Description: Default model type to be used for training
89
+ Type: String
90
+ Value: attn
91
+ Choices: ["aspp", "attn"]
92
+ Inference:
93
+ Description: Default settings when inferring notes.
94
+ Settings:
95
+ MinLength:
96
+ Description: Minimum length of a note in seconds.
97
+ Type: Float
98
+ Value: 0.05
99
+ InstTh:
100
+ Description: Threshold for filtering instruments.
101
+ Type: Float
102
+ Value: 1.1
103
+ OnsetTh:
104
+ Description: Threshold of predicted onset channel.
105
+ Type: Float
106
+ Value: 4
107
+ DuraTh:
108
+ Description: Threshold of predicted duration channel.
109
+ Type: Float
110
+ Value: 0.5
111
+ FrameTh:
112
+ Description: Threshold of frame-level predictions.
113
+ Type: Float
114
+ Value: 0.5
115
+ Training:
116
+ Description: Parameters for training
117
+ Settings:
118
+ Epoch:
119
+ Description: Maximum number of epochs for training.
120
+ Type: Integer
121
+ Value: 20
122
+ Steps:
123
+ Description: Number of training steps for each epoch.
124
+ Type: Integer
125
+ Value: 3000
126
+ ValSteps:
127
+ Description: Number of validation steps after each training epoch.
128
+ Type: Integer
129
+ Value: 500
130
+ BatchSize:
131
+ Description: Batch size of each training step.
132
+ Type: Integer
133
+ Value: 8
134
+ ValBatchSize:
135
+ Description: Batch size of each validation step.
136
+ Type: Integer
137
+ Value: 8
138
+ EarlyStop:
139
+ Description: Terminate the training if the validation performance doesn't improve after n epochs.
140
+ Type: Integer
141
+ Value: 6
142
+ LossFunction:
143
+ Description: Loss function for computing the objectives.
144
+ Type: String
145
+ Value: smooth
146
+ Choices: ["smooth", "focal", "bce"]
147
+ LabelType:
148
+ Description: Determines the training target to be single- or multi-instrument scenario, and more options.
149
+ Type: String
150
+ Value: note
151
+ Choices: ["note-stream", "frame-stream", "note", "frame"]
152
+ Channels:
153
+ Description: Use different types of feature for training.
154
+ Type: List
155
+ SubType: String
156
+ Value: ["Spec", "Ceps"]
157
+ Choices: ["Spec", "GCoS", "Ceps"]
158
+ Timesteps:
159
+ Description: Length of time axis of the input feature.
160
+ Type: Integer
161
+ Value: 128
162
+ FeatureNum:
163
+ Description: The target size of feature dimension.
164
+ Type: Integer
165
+ Value: 384
166
+
omnizart/music/music_piano/saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f90191ba7c4dd251db9600119581a7a71daf35266da57097694861b325429e23
3
+ size 4027989
omnizart/music/music_piano/variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd93da1d0b4e2a59f8c473580380d2388df7ec86d0c8d7803a2863c530d005bf
3
+ size 50407445
omnizart/music/music_piano/variables/variables.index ADDED
Binary file (19.2 kB). View file
 
omnizart/music/music_pop/configurations.yaml ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ General:
2
+ CheckpointPath:
3
+ Value:
4
+ Piano: checkpoints/music/music_piano
5
+ Pop: checkpoints/music/music_pop
6
+ Stream: checkpoints/music/music_note_stream
7
+ Dataset:
8
+ Settings:
9
+ FeatureSavePath:
10
+ Value: +
11
+ FeatureType:
12
+ Value: CFP
13
+ SavePath:
14
+ Value: ./
15
+ Feature:
16
+ Settings:
17
+ BinsPerOctave:
18
+ Value: 48
19
+ FrequencyCenter:
20
+ Value: 27.5
21
+ FrequencyResolution:
22
+ Value: 2.0
23
+ Gamma:
24
+ Value:
25
+ - 0.24
26
+ - 0.6
27
+ - 1.0
28
+ Harmonic:
29
+ Value: false
30
+ HarmonicNumber:
31
+ Value: 6
32
+ HopSize:
33
+ Value: 0.02
34
+ SamplingRate:
35
+ Value: 44100
36
+ TimeCenter:
37
+ Value: 0.00022287
38
+ WindowSize:
39
+ Value: 7939
40
+ Inference:
41
+ Settings:
42
+ DuraTh:
43
+ Value: 0.5
44
+ FrameTh:
45
+ Value: 0.5
46
+ InstTh:
47
+ Value: 1.1
48
+ MinLength:
49
+ Value: 0.05
50
+ OnsetTh:
51
+ Value: 6.0
52
+ Model:
53
+ Settings:
54
+ ModelType:
55
+ Value: attn
56
+ SavePath:
57
+ Value: ./checkpoints/music
58
+ SavePrefix:
59
+ Value: music
60
+ Training:
61
+ Settings:
62
+ BatchSize:
63
+ Value: 8
64
+ Channels:
65
+ Value:
66
+ - Spec
67
+ - Ceps
68
+ - GCoS
69
+ EarlyStop:
70
+ Value: 6
71
+ Epoch:
72
+ Value: 20
73
+ FeatureNum:
74
+ Value: 352
75
+ LabelType:
76
+ Value: pop-note-stream
77
+ LossFunction:
78
+ Value: smooth
79
+ Steps:
80
+ Value: 3000
81
+ Timesteps:
82
+ Value: 128
83
+ ValBatchSize:
84
+ Value: 8
85
+ ValSteps:
86
+ Value: 500
87
+ TranscriptionMode:
88
+ Value: Pop
omnizart/music/music_pop/saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80374501dc49c07296419ca8850bbf8008d6fd76aa3f447ad91add482a9a42a7
3
+ size 4448052
omnizart/music/music_pop/variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cf77d6b5e95f4034d824049104cc93830a8a2c40399eb45dc8488ad072aeeb4
3
+ size 33498559
omnizart/music/music_pop/variables/variables.index ADDED
Binary file (18.4 kB). View file
 
omnizart/patch_cnn/patch_cnn_melody/configurations.yaml ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ General:
3
+ TranscriptionMode:
4
+ Description: Mode of transcription by executing the `omnizart_fix patch-cnn transcribe` command.
5
+ Type: String
6
+ Value: Melody
7
+ CheckpointPath:
8
+ Description: Path to the pre-trained models.
9
+ Type: Map
10
+ SubType: [String, String]
11
+ Value:
12
+ Melody: checkpoints/patch_cnn/patch_cnn_melody
13
+ Feature:
14
+ Description: Default settings of feature extraction
15
+ Settings:
16
+ PatchSize:
17
+ Description: Input size of feature dimension.
18
+ Type: Integer
19
+ Value: 25
20
+ PeakThreshold:
21
+ Description: Threshold used to filter out peaks with small value.
22
+ Type: Float
23
+ Value: 0.5
24
+ HopSize:
25
+ Description: Hop size in seconds with respect to sampling rate.
26
+ Type: Float
27
+ Value: 0.02
28
+ SamplingRate:
29
+ Description: Adjust input sampling rate to this value.
30
+ Type: Integer
31
+ Value: 16000
32
+ WindowSize:
33
+ Type: Integer
34
+ Value: 2049
35
+ FrequencyResolution:
36
+ Type: Float
37
+ Value: 2.0
38
+ FrequencyCenter:
39
+ Description: Lowest frequency to extract.
40
+ Type: Float
41
+ Value: 80
42
+ TimeCenter:
43
+ Description: Highest frequency to extract (1/time_center).
44
+ Type: Float
45
+ Value: 0.001
46
+ Gamma:
47
+ Type: List
48
+ SubType: Float
49
+ Value: [0.24, 0.6, 1.0]
50
+ BinsPerOctave:
51
+ Description: Number of bins for each octave.
52
+ Type: Integer
53
+ Value: 48
54
+ Model:
55
+ Description: Default settings of training / testing the model.
56
+ Settings:
57
+ SavePrefix:
58
+ Description: Prefix of the trained model's name to be saved.
59
+ Type: String
60
+ Value: patch_cnn
61
+ SavePath:
62
+ Description: Path to save the trained model.
63
+ Type: String
64
+ Value: ./checkpoints/patch_cnn
65
+ Dataset:
66
+ Description: Settings of datasets.
67
+ Settings:
68
+ SavePath:
69
+ Description: Path for storing the downloaded datasets.
70
+ Type: String
71
+ Value: ./
72
+ FeatureSavePath:
73
+ Description: Path for storing the extracted feature. Default to the path under the dataset folder.
74
+ Type: String
75
+ Value: +
76
+ Inference:
77
+ Description: Default settings when inferring notes.
78
+ Settings:
79
+ Threshold:
80
+ Description: Threshold of the prediction value.
81
+ Type: Float
82
+ Value: 0.5
83
+ MaxMethod:
84
+ Description: Method of determining the position of the max prediction value.
85
+ Type: String
86
+ Value: posterior
87
+ Choices: ["posterior", "prior"]
88
+ Training:
89
+ Description: Hyper parameters for training
90
+ Settings:
91
+ Epoch:
92
+ Description: Maximum number of epochs for training.
93
+ Type: Integer
94
+ Value: 10
95
+ Steps:
96
+ Description: Number of training steps for each epoch.
97
+ Type: Integer
98
+ Value: 1000
99
+ ValSteps:
100
+ Description: Number of validation steps after each training epoch.
101
+ Type: Integer
102
+ Value: 500
103
+ BatchSize:
104
+ Description: Batch size of each training step.
105
+ Type: Integer
106
+ Value: 32
107
+ ValBatchSize:
108
+ Description: Batch size of each validation step.
109
+ Type: Integer
110
+ Value: 32
111
+ EarlyStop:
112
+ Description: Terminate the training if the validation performance doesn't improve after n epochs.
113
+ Type: Integer
114
+ Value: 4
115
+ InitLearningRate:
116
+ Descriptoin: Initial learning rate.
117
+ Type: Float
118
+ Value: 0.0001
omnizart/patch_cnn/patch_cnn_melody/saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78a90299f4b24484dbf4638df16f4bc25af3f2f2b36d37b5197f7de72525f720
3
+ size 155120
omnizart/patch_cnn/patch_cnn_melody/variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbbd11fc0b60a5f3986c39f7bb3985205d719031f70f916edc560f8b4d01b51a
3
+ size 708098
omnizart/patch_cnn/patch_cnn_melody/variables/variables.index ADDED
Binary file (760 Bytes). View file
 
omnizart/vocal/vocal_contour/configurations.yaml ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ General:
2
+ TranscriptionMode:
3
+ Value: VocalContour
4
+ CheckpointPath:
5
+ Value:
6
+ VocalContour: checkpoints/vocal/contour
7
+ Dataset:
8
+ Settings:
9
+ FeatureSavePath:
10
+ Value: +
11
+ SavePath:
12
+ Value: ./
13
+ Feature:
14
+ Settings:
15
+ HopSize:
16
+ Value: 0.02
17
+ SamplingRate:
18
+ Value: 16000
19
+ WindowSize:
20
+ Value: 2049
21
+ Model:
22
+ Settings:
23
+ SavePath:
24
+ Value: ./checkpoints/vocal_frame
25
+ SavePrefix:
26
+ Value: vocal-frame
27
+ Training:
28
+ Settings:
29
+ BatchSize:
30
+ Value: 12
31
+ EarlyStop:
32
+ Value: 3
33
+ Epoch:
34
+ Value: 5
35
+ Steps:
36
+ Value: 6000
37
+ Timesteps:
38
+ Value: 128
39
+ ValBatchSize:
40
+ Value: 12
41
+ ValSteps:
42
+ Value: 200
omnizart/vocal/vocal_contour/saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c71303199c361155c4cfac2ea9e5aeb9945ad63f5f9f38961aac59ab29c0a5b
3
+ size 4029577
omnizart/vocal/vocal_contour/variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b5c76f749ab552d7735fdcd472ebf29dd31d41609fe8b1160b9c037d6919339
3
+ size 50401019
omnizart/vocal/vocal_contour/variables/variables.index ADDED
Binary file (19.2 kB). View file
 
omnizart/vocal/vocal_semi/configurations.yaml ADDED
@@ -0,0 +1,150 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ General:
3
+ TranscriptionMode:
4
+ Description: Mode of transcription used when executing the `omnizart_fix vocal transcribe` command.
5
+ Type: String
6
+ Value: Semi
7
+ CheckpointPath:
8
+ Description: Path to the pre-trained models.
9
+ Type: Map
10
+ SubType: [String, String]
11
+ Value:
12
+ Super: checkpoints/vocal/vocal_super
13
+ Semi: checkpoints/vocal/vocal_semi
14
+ Feature:
15
+ Description: Default settings of feature extraction for vocal transcription.
16
+ Settings:
17
+ HopSize:
18
+ Description: Hop size in seconds with respect to sampling rate.
19
+ Type: Float
20
+ Value: 0.02
21
+ SamplingRate:
22
+ Description: Adjust input sampling rate to this value.
23
+ Type: Integer
24
+ Value: 16000
25
+ FrequencyResolution:
26
+ Type: Float
27
+ Value: 2.0
28
+ FrequencyCenter:
29
+ Description: Lowest frequency to extract.
30
+ Type: Float
31
+ Value: 80
32
+ TimeCenter:
33
+ Description: Highest frequency to extract (1/time_center).
34
+ Type: Float
35
+ Value: 0.001
36
+ Gamma:
37
+ Type: List
38
+ SubType: Float
39
+ Value: [0.24, 0.6, 1.0]
40
+ BinsPerOctave:
41
+ Description: Number of bins for each octave.
42
+ Type: Integer
43
+ Value: 48
44
+ Dataset:
45
+ Description: Settings of datasets.
46
+ Settings:
47
+ SavePath:
48
+ Description: Path for storing the downloaded datasets.
49
+ Type: String
50
+ Value: ./
51
+ FeatureSavePath:
52
+ Description: Path for storing the extracted feature. Default to the path under the dataset folder.
53
+ Type: String
54
+ Value: +
55
+ Model:
56
+ Description: Default settings of training / testing the model.
57
+ Settings:
58
+ SavePrefix:
59
+ Description: Prefix of the trained model's name to be saved.
60
+ Type: String
61
+ Value: vocal
62
+ SavePath:
63
+ Description: Path to save the trained model.
64
+ Type: String
65
+ Value: ./checkpoints/vocal
66
+ MinKernelSize:
67
+ Description: Minimum kernel size of convolution layers in each pyramid block.
68
+ Type: Integer
69
+ Value: 16
70
+ Depth:
71
+ Description: Total number of pyramid blocks will be (Depth - 2) / 2.
72
+ Type: Integer
73
+ Value: 110
74
+ Alpha:
75
+ Type: Integer
76
+ Value: 270
77
+ ShakeDrop:
78
+ Description: Whether to leverage ShakeDrop regularization during back propagation.
79
+ Type: Bool
80
+ Value: True
81
+ SemiLossWeight:
82
+ Description: Weighting factor of the semi-supervised loss. Supervised loss will not be affected by this parameter.
83
+ Type: Float
84
+ Value: 1.0
85
+ SemiXi:
86
+ Description: A small constant value for weighting the adversarial perturbation.
87
+ Type: Float
88
+ Value: 0.000001
89
+ SemiEpsilon:
90
+ Description: Weighting factor of the output adversarial perturbation.
91
+ Type: Float
92
+ Value: 8.0
93
+ SemiIterations:
94
+ Description: Number of iterations when generating the adversarial perturbation.
95
+ Type: Integer
96
+ Value: 2
97
+ Inference:
98
+ Description: Default settings when inferring notes.
99
+ Settings:
100
+ ContextLength:
101
+ Description: Length of context that will be used to find the peaks.
102
+ Type: Integer
103
+ Value: 2
104
+ Threshold:
105
+ Description: Threshold that will be applied to clip the predicted values to either 0 or 1.
106
+ Type: Float
107
+ Value: 0.5
108
+ MinDuration:
109
+ Description: Minimum required length of each note, in seconds.
110
+ Type: Float
111
+ Value: 0.1
112
+ PitchModel:
113
+ Description: The model for predicting the pitch contour. Defaults to the vocal-contour module. Can be a path or a mode name.
114
+ Type: String
115
+ Value: VocalContour
116
+ Training:
117
+ Description: Hyper parameters for training
118
+ Settings:
119
+ Epoch:
120
+ Description: Maximum number of epochs for training.
121
+ Type: Integer
122
+ Value: 10
123
+ Steps:
124
+ Description: Number of training steps for each epoch.
125
+ Type: Integer
126
+ Value: 1000
127
+ ValSteps:
128
+ Description: Number of validation steps after each training epoch.
129
+ Type: Integer
130
+ Value: 50
131
+ BatchSize:
132
+ Description: Batch size of each training step.
133
+ Type: Integer
134
+ Value: 64
135
+ ValBatchSize:
136
+ Description: Batch size of each validation step.
137
+ Type: Integer
138
+ Value: 64
139
+ EarlyStop:
140
+ Description: Terminate the training if the validation performance doesn't improve after n epochs.
141
+ Type: Integer
142
+ Value: 8
143
+ InitLearningRate:
144
+ Description: Initial learning rate.
145
+ Type: Float
146
+ Value: 0.0001
147
+ ContextLength:
148
+ Description: Context to be considered before and after current timestamp.
149
+ Type: Integer
150
+ Value: 9
omnizart/vocal/vocal_semi/saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec5296106686e602b7fa1fc0462911234c3203c5f553b59b99a0d34671466043
3
+ size 14281573
omnizart/vocal/vocal_semi/variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c60c2e441adbe00f7c8c204a1b923e16bb35efa364ed76320bd70356496a9cc3
3
+ size 114617623
omnizart/vocal/vocal_semi/variables/variables.index ADDED
Binary file (45.8 kB). View file