Upload folder using huggingface_hub
Browse files- .gitattributes +10 -0
- omnizart/beat/beat_blstm/configurations.yaml +58 -0
- omnizart/beat/beat_blstm/saved_model.pb +3 -0
- omnizart/beat/beat_blstm/variables/variables.data-00000-of-00001 +3 -0
- omnizart/beat/beat_blstm/variables/variables.index +0 -0
- omnizart/chord/chord_v1/configurations.yaml +119 -0
- omnizart/chord/chord_v1/saved_model.pb +3 -0
- omnizart/chord/chord_v1/variables/variables.data-00000-of-00001 +3 -0
- omnizart/chord/chord_v1/variables/variables.index +0 -0
- omnizart/drum/drum_keras/configurations.yaml +115 -0
- omnizart/drum/drum_keras/saved_model.pb +3 -0
- omnizart/drum/drum_keras/variables/variables.data-00000-of-00001 +3 -0
- omnizart/drum/drum_keras/variables/variables.index +0 -0
- omnizart/music/music_note_stream/configurations.yaml +86 -0
- omnizart/music/music_note_stream/saved_model.pb +3 -0
- omnizart/music/music_note_stream/variables/variables.data-00000-of-00001 +3 -0
- omnizart/music/music_note_stream/variables/variables.index +0 -0
- omnizart/music/music_piano-v2/configurations.yaml +88 -0
- omnizart/music/music_piano-v2/saved_model.pb +3 -0
- omnizart/music/music_piano-v2/variables/variables.data-00000-of-00001 +3 -0
- omnizart/music/music_piano-v2/variables/variables.index +0 -0
- omnizart/music/music_piano/configurations.yaml +166 -0
- omnizart/music/music_piano/saved_model.pb +3 -0
- omnizart/music/music_piano/variables/variables.data-00000-of-00001 +3 -0
- omnizart/music/music_piano/variables/variables.index +0 -0
- omnizart/music/music_pop/configurations.yaml +88 -0
- omnizart/music/music_pop/saved_model.pb +3 -0
- omnizart/music/music_pop/variables/variables.data-00000-of-00001 +3 -0
- omnizart/music/music_pop/variables/variables.index +0 -0
- omnizart/patch_cnn/patch_cnn_melody/configurations.yaml +118 -0
- omnizart/patch_cnn/patch_cnn_melody/saved_model.pb +3 -0
- omnizart/patch_cnn/patch_cnn_melody/variables/variables.data-00000-of-00001 +3 -0
- omnizart/patch_cnn/patch_cnn_melody/variables/variables.index +0 -0
- omnizart/vocal/vocal_contour/configurations.yaml +42 -0
- omnizart/vocal/vocal_contour/saved_model.pb +3 -0
- omnizart/vocal/vocal_contour/variables/variables.data-00000-of-00001 +3 -0
- omnizart/vocal/vocal_contour/variables/variables.index +0 -0
- omnizart/vocal/vocal_semi/configurations.yaml +150 -0
- omnizart/vocal/vocal_semi/saved_model.pb +3 -0
- omnizart/vocal/vocal_semi/variables/variables.data-00000-of-00001 +3 -0
- omnizart/vocal/vocal_semi/variables/variables.index +0 -0
.gitattributes
CHANGED
|
@@ -35,3 +35,13 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
basicpitch/nmp/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 37 |
basicpitch/nmp_vamp_plugin/ircambasicpitch.so filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
basicpitch/nmp/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 37 |
basicpitch/nmp_vamp_plugin/ircambasicpitch.so filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
omnizart/beat/beat_blstm/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
omnizart/chord/chord_v1/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
omnizart/drum/drum_keras/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
omnizart/music/music_note_stream/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
omnizart/music/music_piano/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
omnizart/music/music_piano-v2/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
omnizart/music/music_pop/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
omnizart/patch_cnn/patch_cnn_melody/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
omnizart/vocal/vocal_contour/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
omnizart/vocal/vocal_semi/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
omnizart/beat/beat_blstm/configurations.yaml
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
General:
|
| 2 |
+
CheckpointPath:
|
| 3 |
+
Value:
|
| 4 |
+
BLSTM: checkpoints/beat/beat_blstm
|
| 5 |
+
Dataset:
|
| 6 |
+
Settings:
|
| 7 |
+
FeatureSavePath:
|
| 8 |
+
Value: +
|
| 9 |
+
SavePath:
|
| 10 |
+
Value: ./
|
| 11 |
+
Feature:
|
| 12 |
+
Settings:
|
| 13 |
+
TimeUnit:
|
| 14 |
+
Value: 0.01
|
| 15 |
+
Inference:
|
| 16 |
+
Settings:
|
| 17 |
+
BeatThreshold:
|
| 18 |
+
Value: 0.5
|
| 19 |
+
DownBeatThreshold:
|
| 20 |
+
Value: 0.3
|
| 21 |
+
MinDistance:
|
| 22 |
+
Value: 0.3
|
| 23 |
+
Model:
|
| 24 |
+
Settings:
|
| 25 |
+
AttnHiddenDim:
|
| 26 |
+
Value: 256
|
| 27 |
+
LstmHiddenDim:
|
| 28 |
+
Value: 25
|
| 29 |
+
ModelType:
|
| 30 |
+
Value: blstm
|
| 31 |
+
NumLstmLayers:
|
| 32 |
+
Value: 2
|
| 33 |
+
SavePath:
|
| 34 |
+
Value: ./checkpoints/beat
|
| 35 |
+
SavePrefix:
|
| 36 |
+
Value: beat
|
| 37 |
+
Timesteps:
|
| 38 |
+
Value: 1000
|
| 39 |
+
Training:
|
| 40 |
+
Settings:
|
| 41 |
+
BatchSize:
|
| 42 |
+
Value: 64
|
| 43 |
+
DownBeatWeight:
|
| 44 |
+
Value: 5
|
| 45 |
+
EarlyStop:
|
| 46 |
+
Value: 4
|
| 47 |
+
Epoch:
|
| 48 |
+
Value: 10
|
| 49 |
+
InitLearningRate:
|
| 50 |
+
Value: 0.001
|
| 51 |
+
Steps:
|
| 52 |
+
Value: 2000
|
| 53 |
+
ValBatchSize:
|
| 54 |
+
Value: 64
|
| 55 |
+
ValSteps:
|
| 56 |
+
Value: 200
|
| 57 |
+
TranscriptionMode:
|
| 58 |
+
Value: BLSTM
|
omnizart/beat/beat_blstm/saved_model.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a0bff208bd559b49df510f2e5177e28b755a29ae36ac690377e00529971417b
|
| 3 |
+
size 5077079
|
omnizart/beat/beat_blstm/variables/variables.data-00000-of-00001
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:673692c2d4cff145bcaad5396d61e480aa442c86f1ac928be2da18568a306057
|
| 3 |
+
size 400241555
|
omnizart/beat/beat_blstm/variables/variables.index
ADDED
|
Binary file (1.23 kB). View file
|
|
|
omnizart/chord/chord_v1/configurations.yaml
ADDED
|
@@ -0,0 +1,119 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
General:
|
| 3 |
+
TranscriptionMode:
|
| 4 |
+
Description: Mode of transcription by executing the `omnizart_fix chord transcribe` command.
|
| 5 |
+
Type: String
|
| 6 |
+
Value: ChordV1
|
| 7 |
+
CheckpointPath:
|
| 8 |
+
Description: Path to the pre-trained models.
|
| 9 |
+
Type: Map
|
| 10 |
+
SubType: [String, String]
|
| 11 |
+
Value:
|
| 12 |
+
ChordV1: checkpoints/chord/chord_v1
|
| 13 |
+
Feature:
|
| 14 |
+
Description: Default settings of feature extraction for chord transcription.
|
| 15 |
+
Settings:
|
| 16 |
+
SegmentWidth:
|
| 17 |
+
Description: Width of segments. Each frame lasts for 0.046 seconds, and thus each segment would last for around 0.5 seconds.
|
| 18 |
+
Type: Integer
|
| 19 |
+
Value: 21
|
| 20 |
+
SegmentHop:
|
| 21 |
+
Description: Hop size of the segment.
|
| 22 |
+
Type: Integer
|
| 23 |
+
Value: 5
|
| 24 |
+
NumSteps:
|
| 25 |
+
Description: Number of total steps. Default setting would have around 23 seconds.
|
| 26 |
+
Type: Integer
|
| 27 |
+
Value: 100
|
| 28 |
+
Dataset:
|
| 29 |
+
Description: Settings of datasets.
|
| 30 |
+
Settings:
|
| 31 |
+
SavePath:
|
| 32 |
+
Description: Path for storing the downloaded datasets.
|
| 33 |
+
Type: String
|
| 34 |
+
Value: ./
|
| 35 |
+
FeatureSavePath:
|
| 36 |
+
Description: Path for storing the extracted feature. Default to the path under the dataset folder.
|
| 37 |
+
Type: String
|
| 38 |
+
Value: +
|
| 39 |
+
Model:
|
| 40 |
+
Description: Default settings of training / testing the model.
|
| 41 |
+
Settings:
|
| 42 |
+
SavePrefix:
|
| 43 |
+
Description: Prefix of the trained model's name to be saved.
|
| 44 |
+
Type: String
|
| 45 |
+
Value: chord
|
| 46 |
+
SavePath:
|
| 47 |
+
Description: Path to save the trained model.
|
| 48 |
+
Type: String
|
| 49 |
+
Value: ./checkpoints/chord
|
| 50 |
+
NumEncAttnBlocks:
|
| 51 |
+
Description: Number of attention blocks for encoder.
|
| 52 |
+
Type: Integer
|
| 53 |
+
Value: 2
|
| 54 |
+
NumDecAttnBlocks:
|
| 55 |
+
Description: Number of attention blocks for decoder.
|
| 56 |
+
Type: Integer
|
| 57 |
+
Value: 2
|
| 58 |
+
FreqSize:
|
| 59 |
+
Description: Available size on the frequency axis to be seen.
|
| 60 |
+
Type: Integer
|
| 61 |
+
Value: 24
|
| 62 |
+
EncInputEmbSize:
|
| 63 |
+
Description: Embedding size of the encoder's input.
|
| 64 |
+
Type: Integer
|
| 65 |
+
Value: 512
|
| 66 |
+
DecInputEmbSize:
|
| 67 |
+
Description: Embedding size of the decoder's input.
|
| 68 |
+
Type: Integer
|
| 69 |
+
Value: 512
|
| 70 |
+
DropoutRate:
|
| 71 |
+
Description: Dropout rate of all dropout layers.
|
| 72 |
+
Type: Float
|
| 73 |
+
Value: 0.6
|
| 74 |
+
AnnealingRate:
|
| 75 |
+
Description: To be added...
|
| 76 |
+
Type: Float
|
| 77 |
+
Value: 1.1
|
| 78 |
+
Inference:
|
| 79 |
+
Description: Default settings when inferring notes.
|
| 80 |
+
Settings:
|
| 81 |
+
MinDura:
|
| 82 |
+
Description: Minimum duration (in seconds) for each chord. If shorter than expected, will append the duration to the previous chord.
|
| 83 |
+
Type: Float
|
| 84 |
+
Value: 0.1
|
| 85 |
+
Training:
|
| 86 |
+
Description: Hyper parameters for training
|
| 87 |
+
Settings:
|
| 88 |
+
Epoch:
|
| 89 |
+
Description: Maximum number of epochs for training.
|
| 90 |
+
Type: Integer
|
| 91 |
+
Value: 10
|
| 92 |
+
Steps:
|
| 93 |
+
Description: Number of training steps for each epoch.
|
| 94 |
+
Type: Integer
|
| 95 |
+
Value: 1000
|
| 96 |
+
ValSteps:
|
| 97 |
+
Description: Number of validation steps after each training epoch.
|
| 98 |
+
Type: Integer
|
| 99 |
+
Value: 500
|
| 100 |
+
BatchSize:
|
| 101 |
+
Description: Batch size of each training step.
|
| 102 |
+
Type: Integer
|
| 103 |
+
Value: 32
|
| 104 |
+
ValBatchSize:
|
| 105 |
+
Description: Batch size of each validation step.
|
| 106 |
+
Type: Integer
|
| 107 |
+
Value: 32
|
| 108 |
+
EarlyStop:
|
| 109 |
+
Description: Terminate the training if the validation performance doesn't improve after n epochs.
|
| 110 |
+
Type: Integer
|
| 111 |
+
Value: 4
|
| 112 |
+
InitLearningRate:
|
| 113 |
+
Description: Initial learning rate.
|
| 114 |
+
Type: Float
|
| 115 |
+
Value: 0.0001
|
| 116 |
+
LearningRateDecay:
|
| 117 |
+
Description: Decaying rate of learning rate per epoch.
|
| 118 |
+
Type: Float
|
| 119 |
+
Value: 0.96
|
omnizart/chord/chord_v1/saved_model.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:489a3db29d528d67d1b7743a0301a4ab81f0803bfcbb0e819615eb64ec67203b
|
| 3 |
+
size 23098326
|
omnizart/chord/chord_v1/variables/variables.data-00000-of-00001
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba35defa2a043c3cf9d3ef9512a83a6fe6bb62cd247026de50f58bdc0e71317d
|
| 3 |
+
size 44242072
|
omnizart/chord/chord_v1/variables/variables.index
ADDED
|
Binary file (7.13 kB). View file
|
|
|
omnizart/drum/drum_keras/configurations.yaml
ADDED
|
@@ -0,0 +1,115 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
General:
|
| 3 |
+
TranscriptionMode:
|
| 4 |
+
Description: Mode of transcription by executing the `omnizart_fix transcribe drum` command.
|
| 5 |
+
Type: String
|
| 6 |
+
Value: keras
|
| 7 |
+
CheckpointPath:
|
| 8 |
+
Description: Path to the pre-trained models.
|
| 9 |
+
Type: Map
|
| 10 |
+
SubType: [String, String]
|
| 11 |
+
Value:
|
| 12 |
+
keras: ./checkpoints/drum/drum_keras
|
| 13 |
+
Feature:
|
| 14 |
+
Description: Default settings of feature extraction for drum transcription.
|
| 15 |
+
Settings:
|
| 16 |
+
SamplingRate:
|
| 17 |
+
Description: Adjust input sampling rate to this value.
|
| 18 |
+
Type: Integer
|
| 19 |
+
Value: 44100
|
| 20 |
+
PaddingSeconds:
|
| 21 |
+
Description: Padding length to the begin and the end of the raw audio data.
|
| 22 |
+
Type: Float
|
| 23 |
+
Value: 1.0
|
| 24 |
+
LowestNote:
|
| 25 |
+
Description: Lowest MIDI note number to be considered.
|
| 26 |
+
Type: Integer
|
| 27 |
+
Value: 16
|
| 28 |
+
NumberOfNotes:
|
| 29 |
+
Description: Number of total notes to extract.
|
| 30 |
+
Type: Integer
|
| 31 |
+
Value: 120
|
| 32 |
+
HopSize:
|
| 33 |
+
Description: Hop size for computing CQT feature.
|
| 34 |
+
Type: Integer
|
| 35 |
+
Value: 256
|
| 36 |
+
MiniBeatPerBar:
|
| 37 |
+
Description: Number of mini beats in a single 4/4 measure.
|
| 38 |
+
Type: Integer
|
| 39 |
+
Value: 32
|
| 40 |
+
MiniBeatPerSegment:
|
| 41 |
+
Description: Number of mini beats in a single segment.
|
| 42 |
+
Type: Integer
|
| 43 |
+
Value: 4
|
| 44 |
+
Dataset:
|
| 45 |
+
Description: Settings of datasets.
|
| 46 |
+
Settings:
|
| 47 |
+
SavePath:
|
| 48 |
+
Description: Path for storing the downloaded datasets.
|
| 49 |
+
Type: String
|
| 50 |
+
Value: ./
|
| 51 |
+
FeatureSavePath:
|
| 52 |
+
Description: Path for storing the extracted feature. Default to the path under the dataset folder.
|
| 53 |
+
Type: String
|
| 54 |
+
Value: +
|
| 55 |
+
Model:
|
| 56 |
+
Description: Default settings of training / testing the model.
|
| 57 |
+
Settings:
|
| 58 |
+
SavePrefix:
|
| 59 |
+
Description: Prefix of the trained model's name to be saved.
|
| 60 |
+
Type: String
|
| 61 |
+
Value: drum
|
| 62 |
+
SavePath:
|
| 63 |
+
Description: Path to save the trained model.
|
| 64 |
+
Type: String
|
| 65 |
+
Value: ./checkpoints/drum
|
| 66 |
+
Inference:
|
| 67 |
+
Description: Default settings when inferring notes.
|
| 68 |
+
Settings:
|
| 69 |
+
BassDrumTh:
|
| 70 |
+
Description: Threshold for the bass drum.
|
| 71 |
+
Type: Float
|
| 72 |
+
Value: 0.85
|
| 73 |
+
SnareTh:
|
| 74 |
+
Description: Threshold for the snare.
|
| 75 |
+
Type: Float
|
| 76 |
+
Value: 1.2
|
| 77 |
+
HihatTh:
|
| 78 |
+
Description: Threshold for the hihat.
|
| 79 |
+
Type: Float
|
| 80 |
+
Value: 0.17
|
| 81 |
+
Training:
|
| 82 |
+
Description: Hyper parameters for training
|
| 83 |
+
Settings:
|
| 84 |
+
Epoch:
|
| 85 |
+
Description: Maximum number of epochs for training.
|
| 86 |
+
Type: Integer
|
| 87 |
+
Value: 50
|
| 88 |
+
Steps:
|
| 89 |
+
Description: Number of training steps for each epoch.
|
| 90 |
+
Type: Integer
|
| 91 |
+
Value: 1000
|
| 92 |
+
ValSteps:
|
| 93 |
+
Description: Number of validation steps after each training epoch.
|
| 94 |
+
Type: Integer
|
| 95 |
+
Value: 100
|
| 96 |
+
BatchSize:
|
| 97 |
+
Description: Batch size of each training step.
|
| 98 |
+
Type: Integer
|
| 99 |
+
Value: 32
|
| 100 |
+
ValBatchSize:
|
| 101 |
+
Description: Batch size of each validation step.
|
| 102 |
+
Type: Integer
|
| 103 |
+
Value: 32
|
| 104 |
+
EarlyStop:
|
| 105 |
+
Description: Terminate the training if the validation performance doesn't improve after n epochs.
|
| 106 |
+
Type: Integer
|
| 107 |
+
Value: 6
|
| 108 |
+
InitLearningRate:
|
| 109 |
+
Description: Initial learning rate.
|
| 110 |
+
Type: Float
|
| 111 |
+
Value: 0.00002
|
| 112 |
+
ResBlockNum:
|
| 113 |
+
Description: Number of residual blocks.
|
| 114 |
+
Type: Integer
|
| 115 |
+
Value: 3
|
omnizart/drum/drum_keras/saved_model.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6536f2fd67472cf8fcaea89888410eb6c09b4e3ac72664cb9fffe7441aa6559b
|
| 3 |
+
size 1829175
|
omnizart/drum/drum_keras/variables/variables.data-00000-of-00001
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e5105215ec8bdee5ebba57c2eef8655a310de99da9f3169b3f857e2185ab464
|
| 3 |
+
size 31090686
|
omnizart/drum/drum_keras/variables/variables.index
ADDED
|
Binary file (5.02 kB). View file
|
|
|
omnizart/music/music_note_stream/configurations.yaml
ADDED
|
@@ -0,0 +1,86 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
General:
|
| 2 |
+
CheckpointPath:
|
| 3 |
+
Value:
|
| 4 |
+
Piano: ./checkpoints/music/music_piano
|
| 5 |
+
Pop: ./checkpoints/music/music_pop
|
| 6 |
+
Dataset:
|
| 7 |
+
Settings:
|
| 8 |
+
FeatureSavePath:
|
| 9 |
+
Value: +
|
| 10 |
+
FeatureType:
|
| 11 |
+
Value: CFP
|
| 12 |
+
SavePath:
|
| 13 |
+
Value: ./
|
| 14 |
+
Feature:
|
| 15 |
+
Settings:
|
| 16 |
+
BinsPerOctave:
|
| 17 |
+
Value: 48
|
| 18 |
+
FrequencyCenter:
|
| 19 |
+
Value: 27.5
|
| 20 |
+
FrequencyResolution:
|
| 21 |
+
Value: 2.0
|
| 22 |
+
Gamma:
|
| 23 |
+
Value:
|
| 24 |
+
- 0.24
|
| 25 |
+
- 0.6
|
| 26 |
+
- 1.0
|
| 27 |
+
Harmonic:
|
| 28 |
+
Value: false
|
| 29 |
+
HarmonicNumber:
|
| 30 |
+
Value: 6
|
| 31 |
+
HopSize:
|
| 32 |
+
Value: 0.02
|
| 33 |
+
SamplingRate:
|
| 34 |
+
Value: 44100
|
| 35 |
+
TimeCenter:
|
| 36 |
+
Value: 0.00022287
|
| 37 |
+
WindowSize:
|
| 38 |
+
Value: 7939
|
| 39 |
+
Inference:
|
| 40 |
+
Settings:
|
| 41 |
+
DuraTh:
|
| 42 |
+
Value: 0.5
|
| 43 |
+
FrameTh:
|
| 44 |
+
Value: 0.5
|
| 45 |
+
InstTh:
|
| 46 |
+
Value: 1.1
|
| 47 |
+
MinLength:
|
| 48 |
+
Value: 0.05
|
| 49 |
+
OnsetTh:
|
| 50 |
+
Value: 6.0
|
| 51 |
+
Model:
|
| 52 |
+
Settings:
|
| 53 |
+
ModelType:
|
| 54 |
+
Value: attn
|
| 55 |
+
SavePath:
|
| 56 |
+
Value: ./checkpoints/music
|
| 57 |
+
SavePrefix:
|
| 58 |
+
Value: music
|
| 59 |
+
Training:
|
| 60 |
+
Settings:
|
| 61 |
+
BatchSize:
|
| 62 |
+
Value: 8
|
| 63 |
+
Channels:
|
| 64 |
+
Value:
|
| 65 |
+
- Spec
|
| 66 |
+
- Ceps
|
| 67 |
+
EarlyStop:
|
| 68 |
+
Value: 6
|
| 69 |
+
Epoch:
|
| 70 |
+
Value: 20
|
| 71 |
+
LabelType:
|
| 72 |
+
Value: note-stream
|
| 73 |
+
LossFunction:
|
| 74 |
+
Value: smooth
|
| 75 |
+
Steps:
|
| 76 |
+
Value: 3000
|
| 77 |
+
Timesteps:
|
| 78 |
+
Value: 128
|
| 79 |
+
ValBatchSize:
|
| 80 |
+
Value: 8
|
| 81 |
+
ValSteps:
|
| 82 |
+
Value: 500
|
| 83 |
+
FeatureNum:
|
| 84 |
+
Value: 352
|
| 85 |
+
TranscriptionMode:
|
| 86 |
+
Value: Stream
|
omnizart/music/music_note_stream/saved_model.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b629d1fe06db9bb056d74857376616cdec7d67884bec4ba08aa48235989e7ea1
|
| 3 |
+
size 4448469
|
omnizart/music/music_note_stream/variables/variables.data-00000-of-00001
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a3f1dce36c255b2e34d69e1faba1e0822723240880b5fdd444613fdb2f29eb15
|
| 3 |
+
size 33495027
|
omnizart/music/music_note_stream/variables/variables.index
ADDED
|
Binary file (18.4 kB). View file
|
|
|
omnizart/music/music_piano-v2/configurations.yaml
ADDED
|
@@ -0,0 +1,88 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
General:
|
| 2 |
+
CheckpointPath:
|
| 3 |
+
Value:
|
| 4 |
+
Piano: checkpoints/music/music_piano
|
| 5 |
+
Pop: checkpoints/music/music_pop
|
| 6 |
+
Stream: checkpoints/music/music_note_stream
|
| 7 |
+
Dataset:
|
| 8 |
+
Settings:
|
| 9 |
+
FeatureSavePath:
|
| 10 |
+
Value: +
|
| 11 |
+
FeatureType:
|
| 12 |
+
Value: CFP
|
| 13 |
+
SavePath:
|
| 14 |
+
Value: ./
|
| 15 |
+
Feature:
|
| 16 |
+
Settings:
|
| 17 |
+
BinsPerOctave:
|
| 18 |
+
Value: 48
|
| 19 |
+
FrequencyCenter:
|
| 20 |
+
Value: 27.5
|
| 21 |
+
FrequencyResolution:
|
| 22 |
+
Value: 2.0
|
| 23 |
+
Gamma:
|
| 24 |
+
Value:
|
| 25 |
+
- 0.24
|
| 26 |
+
- 0.6
|
| 27 |
+
- 1.0
|
| 28 |
+
Harmonic:
|
| 29 |
+
Value: false
|
| 30 |
+
HarmonicNumber:
|
| 31 |
+
Value: 6
|
| 32 |
+
HopSize:
|
| 33 |
+
Value: 0.02
|
| 34 |
+
SamplingRate:
|
| 35 |
+
Value: 44100
|
| 36 |
+
TimeCenter:
|
| 37 |
+
Value: 0.00022287
|
| 38 |
+
WindowSize:
|
| 39 |
+
Value: 7939
|
| 40 |
+
Inference:
|
| 41 |
+
Settings:
|
| 42 |
+
DuraTh:
|
| 43 |
+
Value: 0.5
|
| 44 |
+
FrameTh:
|
| 45 |
+
Value: 0.5
|
| 46 |
+
InstTh:
|
| 47 |
+
Value: 1.1
|
| 48 |
+
MinLength:
|
| 49 |
+
Value: 0.05
|
| 50 |
+
OnsetTh:
|
| 51 |
+
Value: 4
|
| 52 |
+
Model:
|
| 53 |
+
Settings:
|
| 54 |
+
ModelType:
|
| 55 |
+
Value: aspp
|
| 56 |
+
SavePath:
|
| 57 |
+
Value: ./checkpoints/music
|
| 58 |
+
SavePrefix:
|
| 59 |
+
Value: music
|
| 60 |
+
Training:
|
| 61 |
+
Settings:
|
| 62 |
+
BatchSize:
|
| 63 |
+
Value: 16
|
| 64 |
+
Channels:
|
| 65 |
+
Value:
|
| 66 |
+
- Spec
|
| 67 |
+
- Ceps
|
| 68 |
+
- GCoS
|
| 69 |
+
EarlyStop:
|
| 70 |
+
Value: 6
|
| 71 |
+
Epoch:
|
| 72 |
+
Value: 30
|
| 73 |
+
FeatureNum:
|
| 74 |
+
Value: 352
|
| 75 |
+
LabelType:
|
| 76 |
+
Value: note
|
| 77 |
+
LossFunction:
|
| 78 |
+
Value: smooth
|
| 79 |
+
Steps:
|
| 80 |
+
Value: 1500
|
| 81 |
+
Timesteps:
|
| 82 |
+
Value: 256
|
| 83 |
+
ValBatchSize:
|
| 84 |
+
Value: 8
|
| 85 |
+
ValSteps:
|
| 86 |
+
Value: 150
|
| 87 |
+
TranscriptionMode:
|
| 88 |
+
Value: Piano
|
omnizart/music/music_piano-v2/saved_model.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2244e3929e88ae32ad32ad46541eab7ce6803d34c6c37cb9445b50ffc89e9281
|
| 3 |
+
size 4402822
|
omnizart/music/music_piano-v2/variables/variables.data-00000-of-00001
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a3316d5fed8054bb7f6aa18021d6787484808894a1eceacea0f9a9f2fe1fb684
|
| 3 |
+
size 84656908
|
omnizart/music/music_piano-v2/variables/variables.index
ADDED
|
Binary file (21.1 kB). View file
|
|
|
omnizart/music/music_piano/configurations.yaml
ADDED
|
@@ -0,0 +1,166 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Self-documented configurable settings, with description, type hint, and available
|
| 2 |
+
# options. All the parameters can be overridden by another specified configuration file
|
| 3 |
+
# with selected parameters.
|
| 4 |
+
|
| 5 |
+
|
| 6 |
+
General:
|
| 7 |
+
TranscriptionMode:
|
| 8 |
+
Description: Mode of transcription by executing the `omnizart_fix transcribe music` command.
|
| 9 |
+
Type: String
|
| 10 |
+
Value: Piano
|
| 11 |
+
CheckpointPath:
|
| 12 |
+
Description: Path to the pre-trained models.
|
| 13 |
+
Type: Map
|
| 14 |
+
SubType: [String, String]
|
| 15 |
+
Value:
|
| 16 |
+
Piano: ./checkpoints/music/music_piano
|
| 17 |
+
Pop: ./checkpoints/music/music_pop
|
| 18 |
+
Stream: ./checkpoints/music/music_note_stream
|
| 19 |
+
Feature:
|
| 20 |
+
Description: Default settings of feature extraction
|
| 21 |
+
Settings:
|
| 22 |
+
HopSize:
|
| 23 |
+
Description: Hop size in seconds with respect to sampling rate.
|
| 24 |
+
Type: Float
|
| 25 |
+
Value: 0.02
|
| 26 |
+
SamplingRate:
|
| 27 |
+
Description: Adjust input sampling rate to this value.
|
| 28 |
+
Type: Integer
|
| 29 |
+
Value: 44100
|
| 30 |
+
WindowSize:
|
| 31 |
+
Type: Integer
|
| 32 |
+
Value: 7939
|
| 33 |
+
FrequencyResolution:
|
| 34 |
+
Type: Float
|
| 35 |
+
Value: 2.0
|
| 36 |
+
FrequencyCenter:
|
| 37 |
+
Description: Lowest frequency to extract.
|
| 38 |
+
Type: Float
|
| 39 |
+
Value: 27.5
|
| 40 |
+
TimeCenter:
|
| 41 |
+
Description: Highest frequency to extract (1/time_center).
|
| 42 |
+
Type: Float
|
| 43 |
+
Value: 0.00022287
|
| 44 |
+
Gamma:
|
| 45 |
+
Type: List
|
| 46 |
+
SubType: Float
|
| 47 |
+
Value: [0.24, 0.6, 1.0]
|
| 48 |
+
BinsPerOctave:
|
| 49 |
+
Description: Number of bins for each octave.
|
| 50 |
+
Type: Integer
|
| 51 |
+
Value: 48
|
| 52 |
+
HarmonicNumber:
|
| 53 |
+
Description: Number of harmonic bins of HCFP feature.
|
| 54 |
+
Type: Integer
|
| 55 |
+
Value: 6
|
| 56 |
+
Harmonic:
|
| 57 |
+
Description: Whether to use harmonic version of the input feature for training.
|
| 58 |
+
Type: Bool
|
| 59 |
+
Value: False
|
| 60 |
+
Dataset:
|
| 61 |
+
Description: Settings of datasets.
|
| 62 |
+
Settings:
|
| 63 |
+
SavePath:
|
| 64 |
+
Description: Path for storing the downloaded datasets.
|
| 65 |
+
Type: String
|
| 66 |
+
Value: ./
|
| 67 |
+
FeatureType:
|
| 68 |
+
Description: Type of feature to extract.
|
| 69 |
+
Type: String
|
| 70 |
+
Value: CFP
|
| 71 |
+
Choices: ["CFP", "HCFP"]
|
| 72 |
+
FeatureSavePath:
|
| 73 |
+
Description: Path for storing the extracted feature. Default to the path under the dataset folder.
|
| 74 |
+
Type: String
|
| 75 |
+
Value: +
|
| 76 |
+
Model:
|
| 77 |
+
Description: Default settings of training / testing the model.
|
| 78 |
+
Settings:
|
| 79 |
+
SavePrefix:
|
| 80 |
+
Description: Prefix of the trained model's name to be saved.
|
| 81 |
+
Type: String
|
| 82 |
+
Value: music
|
| 83 |
+
SavePath:
|
| 84 |
+
Description: Path to save the trained model.
|
| 85 |
+
Type: String
|
| 86 |
+
Value: ./checkpoints/music
|
| 87 |
+
ModelType:
|
| 88 |
+
Description: Default model type to be used for training
|
| 89 |
+
Type: String
|
| 90 |
+
Value: attn
|
| 91 |
+
Choices: ["aspp", "attn"]
|
| 92 |
+
Inference:
|
| 93 |
+
Description: Default settings when inferring notes.
|
| 94 |
+
Settings:
|
| 95 |
+
MinLength:
|
| 96 |
+
Description: Minimum length of a note in seconds.
|
| 97 |
+
Type: Float
|
| 98 |
+
Value: 0.05
|
| 99 |
+
InstTh:
|
| 100 |
+
Description: Threshold for filtering instruments.
|
| 101 |
+
Type: Float
|
| 102 |
+
Value: 1.1
|
| 103 |
+
OnsetTh:
|
| 104 |
+
Description: Threshold of predicted onset channel.
|
| 105 |
+
Type: Float
|
| 106 |
+
Value: 4
|
| 107 |
+
DuraTh:
|
| 108 |
+
Description: Threshold of predicted duration channel.
|
| 109 |
+
Type: Float
|
| 110 |
+
Value: 0.5
|
| 111 |
+
FrameTh:
|
| 112 |
+
Description: Threshold of frame-level predictions.
|
| 113 |
+
Type: Float
|
| 114 |
+
Value: 0.5
|
| 115 |
+
Training:
|
| 116 |
+
Description: Parameters for training
|
| 117 |
+
Settings:
|
| 118 |
+
Epoch:
|
| 119 |
+
Description: Maximum number of epochs for training.
|
| 120 |
+
Type: Integer
|
| 121 |
+
Value: 20
|
| 122 |
+
Steps:
|
| 123 |
+
Description: Number of training steps for each epoch.
|
| 124 |
+
Type: Integer
|
| 125 |
+
Value: 3000
|
| 126 |
+
ValSteps:
|
| 127 |
+
Description: Number of validation steps after each training epoch.
|
| 128 |
+
Type: Integer
|
| 129 |
+
Value: 500
|
| 130 |
+
BatchSize:
|
| 131 |
+
Description: Batch size of each training step.
|
| 132 |
+
Type: Integer
|
| 133 |
+
Value: 8
|
| 134 |
+
ValBatchSize:
|
| 135 |
+
Description: Batch size of each validation step.
|
| 136 |
+
Type: Integer
|
| 137 |
+
Value: 8
|
| 138 |
+
EarlyStop:
|
| 139 |
+
Description: Terminate the training if the validation performance doesn't improve after n epochs.
|
| 140 |
+
Type: Integer
|
| 141 |
+
Value: 6
|
| 142 |
+
LossFunction:
|
| 143 |
+
Description: Loss function for computing the objectives.
|
| 144 |
+
Type: String
|
| 145 |
+
Value: smooth
|
| 146 |
+
Choices: ["smooth", "focal", "bce"]
|
| 147 |
+
LabelType:
|
| 148 |
+
Description: Determines the training target to be single- or multi-instrument scenario, and more options.
|
| 149 |
+
Type: String
|
| 150 |
+
Value: note
|
| 151 |
+
Choices: ["note-stream", "frame-stream", "note", "frame"]
|
| 152 |
+
Channels:
|
| 153 |
+
Description: Use different types of feature for training.
|
| 154 |
+
Type: List
|
| 155 |
+
SubType: String
|
| 156 |
+
Value: ["Spec", "Ceps"]
|
| 157 |
+
Choices: ["Spec", "GCoS", "Ceps"]
|
| 158 |
+
Timesteps:
|
| 159 |
+
Description: Length of time axis of the input feature.
|
| 160 |
+
Type: Integer
|
| 161 |
+
Value: 128
|
| 162 |
+
FeatureNum:
|
| 163 |
+
Description: The target size of feature dimension.
|
| 164 |
+
Type: Integer
|
| 165 |
+
Value: 384
|
| 166 |
+
|
omnizart/music/music_piano/saved_model.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f90191ba7c4dd251db9600119581a7a71daf35266da57097694861b325429e23
|
| 3 |
+
size 4027989
|
omnizart/music/music_piano/variables/variables.data-00000-of-00001
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd93da1d0b4e2a59f8c473580380d2388df7ec86d0c8d7803a2863c530d005bf
|
| 3 |
+
size 50407445
|
omnizart/music/music_piano/variables/variables.index
ADDED
|
Binary file (19.2 kB). View file
|
|
|
omnizart/music/music_pop/configurations.yaml
ADDED
|
@@ -0,0 +1,88 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
General:
|
| 2 |
+
CheckpointPath:
|
| 3 |
+
Value:
|
| 4 |
+
Piano: checkpoints/music/music_piano
|
| 5 |
+
Pop: checkpoints/music/music_pop
|
| 6 |
+
Stream: checkpoints/music/music_note_stream
|
| 7 |
+
Dataset:
|
| 8 |
+
Settings:
|
| 9 |
+
FeatureSavePath:
|
| 10 |
+
Value: +
|
| 11 |
+
FeatureType:
|
| 12 |
+
Value: CFP
|
| 13 |
+
SavePath:
|
| 14 |
+
Value: ./
|
| 15 |
+
Feature:
|
| 16 |
+
Settings:
|
| 17 |
+
BinsPerOctave:
|
| 18 |
+
Value: 48
|
| 19 |
+
FrequencyCenter:
|
| 20 |
+
Value: 27.5
|
| 21 |
+
FrequencyResolution:
|
| 22 |
+
Value: 2.0
|
| 23 |
+
Gamma:
|
| 24 |
+
Value:
|
| 25 |
+
- 0.24
|
| 26 |
+
- 0.6
|
| 27 |
+
- 1.0
|
| 28 |
+
Harmonic:
|
| 29 |
+
Value: false
|
| 30 |
+
HarmonicNumber:
|
| 31 |
+
Value: 6
|
| 32 |
+
HopSize:
|
| 33 |
+
Value: 0.02
|
| 34 |
+
SamplingRate:
|
| 35 |
+
Value: 44100
|
| 36 |
+
TimeCenter:
|
| 37 |
+
Value: 0.00022287
|
| 38 |
+
WindowSize:
|
| 39 |
+
Value: 7939
|
| 40 |
+
Inference:
|
| 41 |
+
Settings:
|
| 42 |
+
DuraTh:
|
| 43 |
+
Value: 0.5
|
| 44 |
+
FrameTh:
|
| 45 |
+
Value: 0.5
|
| 46 |
+
InstTh:
|
| 47 |
+
Value: 1.1
|
| 48 |
+
MinLength:
|
| 49 |
+
Value: 0.05
|
| 50 |
+
OnsetTh:
|
| 51 |
+
Value: 6.0
|
| 52 |
+
Model:
|
| 53 |
+
Settings:
|
| 54 |
+
ModelType:
|
| 55 |
+
Value: attn
|
| 56 |
+
SavePath:
|
| 57 |
+
Value: ./checkpoints/music
|
| 58 |
+
SavePrefix:
|
| 59 |
+
Value: music
|
| 60 |
+
Training:
|
| 61 |
+
Settings:
|
| 62 |
+
BatchSize:
|
| 63 |
+
Value: 8
|
| 64 |
+
Channels:
|
| 65 |
+
Value:
|
| 66 |
+
- Spec
|
| 67 |
+
- Ceps
|
| 68 |
+
- GCoS
|
| 69 |
+
EarlyStop:
|
| 70 |
+
Value: 6
|
| 71 |
+
Epoch:
|
| 72 |
+
Value: 20
|
| 73 |
+
FeatureNum:
|
| 74 |
+
Value: 352
|
| 75 |
+
LabelType:
|
| 76 |
+
Value: pop-note-stream
|
| 77 |
+
LossFunction:
|
| 78 |
+
Value: smooth
|
| 79 |
+
Steps:
|
| 80 |
+
Value: 3000
|
| 81 |
+
Timesteps:
|
| 82 |
+
Value: 128
|
| 83 |
+
ValBatchSize:
|
| 84 |
+
Value: 8
|
| 85 |
+
ValSteps:
|
| 86 |
+
Value: 500
|
| 87 |
+
TranscriptionMode:
|
| 88 |
+
Value: Pop
|
omnizart/music/music_pop/saved_model.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:80374501dc49c07296419ca8850bbf8008d6fd76aa3f447ad91add482a9a42a7
|
| 3 |
+
size 4448052
|
omnizart/music/music_pop/variables/variables.data-00000-of-00001
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7cf77d6b5e95f4034d824049104cc93830a8a2c40399eb45dc8488ad072aeeb4
|
| 3 |
+
size 33498559
|
omnizart/music/music_pop/variables/variables.index
ADDED
|
Binary file (18.4 kB). View file
|
|
|
omnizart/patch_cnn/patch_cnn_melody/configurations.yaml
ADDED
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
General:
|
| 3 |
+
TranscriptionMode:
|
| 4 |
+
Description: Mode of transcription by executing the `omnizart_fix patch-cnn transcribe` command.
|
| 5 |
+
Type: String
|
| 6 |
+
Value: Melody
|
| 7 |
+
CheckpointPath:
|
| 8 |
+
Description: Path to the pre-trained models.
|
| 9 |
+
Type: Map
|
| 10 |
+
SubType: [String, String]
|
| 11 |
+
Value:
|
| 12 |
+
Melody: checkpoints/patch_cnn/patch_cnn_melody
|
| 13 |
+
Feature:
|
| 14 |
+
Description: Default settings of feature extraction
|
| 15 |
+
Settings:
|
| 16 |
+
PatchSize:
|
| 17 |
+
Description: Input size of feature dimension.
|
| 18 |
+
Type: Integer
|
| 19 |
+
Value: 25
|
| 20 |
+
PeakThreshold:
|
| 21 |
+
Description: Threshold used to filter out peaks with small value.
|
| 22 |
+
Type: Float
|
| 23 |
+
Value: 0.5
|
| 24 |
+
HopSize:
|
| 25 |
+
Description: Hop size in seconds with respect to sampling rate.
|
| 26 |
+
Type: Float
|
| 27 |
+
Value: 0.02
|
| 28 |
+
SamplingRate:
|
| 29 |
+
Description: Adjust input sampling rate to this value.
|
| 30 |
+
Type: Integer
|
| 31 |
+
Value: 16000
|
| 32 |
+
WindowSize:
|
| 33 |
+
Type: Integer
|
| 34 |
+
Value: 2049
|
| 35 |
+
FrequencyResolution:
|
| 36 |
+
Type: Float
|
| 37 |
+
Value: 2.0
|
| 38 |
+
FrequencyCenter:
|
| 39 |
+
Description: Lowest frequency to extract.
|
| 40 |
+
Type: Float
|
| 41 |
+
Value: 80
|
| 42 |
+
TimeCenter:
|
| 43 |
+
Description: Highest frequency to extract (1/time_center).
|
| 44 |
+
Type: Float
|
| 45 |
+
Value: 0.001
|
| 46 |
+
Gamma:
|
| 47 |
+
Type: List
|
| 48 |
+
SubType: Float
|
| 49 |
+
Value: [0.24, 0.6, 1.0]
|
| 50 |
+
BinsPerOctave:
|
| 51 |
+
Description: Number of bins for each octave.
|
| 52 |
+
Type: Integer
|
| 53 |
+
Value: 48
|
| 54 |
+
Model:
|
| 55 |
+
Description: Default settings of training / testing the model.
|
| 56 |
+
Settings:
|
| 57 |
+
SavePrefix:
|
| 58 |
+
Description: Prefix of the trained model's name to be saved.
|
| 59 |
+
Type: String
|
| 60 |
+
Value: patch_cnn
|
| 61 |
+
SavePath:
|
| 62 |
+
Description: Path to save the trained model.
|
| 63 |
+
Type: String
|
| 64 |
+
Value: ./checkpoints/patch_cnn
|
| 65 |
+
Dataset:
|
| 66 |
+
Description: Settings of datasets.
|
| 67 |
+
Settings:
|
| 68 |
+
SavePath:
|
| 69 |
+
Description: Path for storing the downloaded datasets.
|
| 70 |
+
Type: String
|
| 71 |
+
Value: ./
|
| 72 |
+
FeatureSavePath:
|
| 73 |
+
Description: Path for storing the extracted feature. Default to the path under the dataset folder.
|
| 74 |
+
Type: String
|
| 75 |
+
Value: +
|
| 76 |
+
Inference:
|
| 77 |
+
Description: Default settings when inferring notes.
|
| 78 |
+
Settings:
|
| 79 |
+
Threshold:
|
| 80 |
+
Description: Threshold of the prediction value.
|
| 81 |
+
Type: Float
|
| 82 |
+
Value: 0.5
|
| 83 |
+
MaxMethod:
|
| 84 |
+
Description: Method of determining the position of the max prediction value.
|
| 85 |
+
Type: String
|
| 86 |
+
Value: posterior
|
| 87 |
+
Choices: ["posterior", "prior"]
|
| 88 |
+
Training:
|
| 89 |
+
Description: Hyper parameters for training
|
| 90 |
+
Settings:
|
| 91 |
+
Epoch:
|
| 92 |
+
Description: Maximum number of epochs for training.
|
| 93 |
+
Type: Integer
|
| 94 |
+
Value: 10
|
| 95 |
+
Steps:
|
| 96 |
+
Description: Number of training steps for each epoch.
|
| 97 |
+
Type: Integer
|
| 98 |
+
Value: 1000
|
| 99 |
+
ValSteps:
|
| 100 |
+
Description: Number of validation steps after each training epoch.
|
| 101 |
+
Type: Integer
|
| 102 |
+
Value: 500
|
| 103 |
+
BatchSize:
|
| 104 |
+
Description: Batch size of each training step.
|
| 105 |
+
Type: Integer
|
| 106 |
+
Value: 32
|
| 107 |
+
ValBatchSize:
|
| 108 |
+
Description: Batch size of each validation step.
|
| 109 |
+
Type: Integer
|
| 110 |
+
Value: 32
|
| 111 |
+
EarlyStop:
|
| 112 |
+
Description: Terminate the training if the validation performance doesn't improve after n epochs.
|
| 113 |
+
Type: Integer
|
| 114 |
+
Value: 4
|
| 115 |
+
InitLearningRate:
|
| 116 |
+
Description: Initial learning rate.
|
| 117 |
+
Type: Float
|
| 118 |
+
Value: 0.0001
|
omnizart/patch_cnn/patch_cnn_melody/saved_model.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78a90299f4b24484dbf4638df16f4bc25af3f2f2b36d37b5197f7de72525f720
|
| 3 |
+
size 155120
|
omnizart/patch_cnn/patch_cnn_melody/variables/variables.data-00000-of-00001
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bbbd11fc0b60a5f3986c39f7bb3985205d719031f70f916edc560f8b4d01b51a
|
| 3 |
+
size 708098
|
omnizart/patch_cnn/patch_cnn_melody/variables/variables.index
ADDED
|
Binary file (760 Bytes). View file
|
|
|
omnizart/vocal/vocal_contour/configurations.yaml
ADDED
|
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
General:
|
| 2 |
+
TranscriptionMode:
|
| 3 |
+
Value: VocalContour
|
| 4 |
+
CheckpointPath:
|
| 5 |
+
Value:
|
| 6 |
+
VocalContour: checkpoints/vocal/contour
|
| 7 |
+
Dataset:
|
| 8 |
+
Settings:
|
| 9 |
+
FeatureSavePath:
|
| 10 |
+
Value: +
|
| 11 |
+
SavePath:
|
| 12 |
+
Value: ./
|
| 13 |
+
Feature:
|
| 14 |
+
Settings:
|
| 15 |
+
HopSize:
|
| 16 |
+
Value: 0.02
|
| 17 |
+
SamplingRate:
|
| 18 |
+
Value: 16000
|
| 19 |
+
WindowSize:
|
| 20 |
+
Value: 2049
|
| 21 |
+
Model:
|
| 22 |
+
Settings:
|
| 23 |
+
SavePath:
|
| 24 |
+
Value: ./checkpoints/vocal_frame
|
| 25 |
+
SavePrefix:
|
| 26 |
+
Value: vocal-frame
|
| 27 |
+
Training:
|
| 28 |
+
Settings:
|
| 29 |
+
BatchSize:
|
| 30 |
+
Value: 12
|
| 31 |
+
EarlyStop:
|
| 32 |
+
Value: 3
|
| 33 |
+
Epoch:
|
| 34 |
+
Value: 5
|
| 35 |
+
Steps:
|
| 36 |
+
Value: 6000
|
| 37 |
+
Timesteps:
|
| 38 |
+
Value: 128
|
| 39 |
+
ValBatchSize:
|
| 40 |
+
Value: 12
|
| 41 |
+
ValSteps:
|
| 42 |
+
Value: 200
|
omnizart/vocal/vocal_contour/saved_model.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c71303199c361155c4cfac2ea9e5aeb9945ad63f5f9f38961aac59ab29c0a5b
|
| 3 |
+
size 4029577
|
omnizart/vocal/vocal_contour/variables/variables.data-00000-of-00001
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b5c76f749ab552d7735fdcd472ebf29dd31d41609fe8b1160b9c037d6919339
|
| 3 |
+
size 50401019
|
omnizart/vocal/vocal_contour/variables/variables.index
ADDED
|
Binary file (19.2 kB). View file
|
|
|
omnizart/vocal/vocal_semi/configurations.yaml
ADDED
|
@@ -0,0 +1,150 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
General:
|
| 3 |
+
TranscriptionMode:
|
| 4 |
+
Description: Mode of transcription by executing the `omnizart_fix vocal transcribe` command.
|
| 5 |
+
Type: String
|
| 6 |
+
Value: Semi
|
| 7 |
+
CheckpointPath:
|
| 8 |
+
Description: Path to the pre-trained models.
|
| 9 |
+
Type: Map
|
| 10 |
+
SubType: [String, String]
|
| 11 |
+
Value:
|
| 12 |
+
Super: checkpoints/vocal/vocal_super
|
| 13 |
+
Semi: checkpoints/vocal/vocal_semi
|
| 14 |
+
Feature:
|
| 15 |
+
Description: Default settings of feature extraction for vocal transcription.
|
| 16 |
+
Settings:
|
| 17 |
+
HopSize:
|
| 18 |
+
Description: Hop size in seconds with respect to sampling rate.
|
| 19 |
+
Type: Float
|
| 20 |
+
Value: 0.02
|
| 21 |
+
SamplingRate:
|
| 22 |
+
Description: Adjust input sampling rate to this value.
|
| 23 |
+
Type: Integer
|
| 24 |
+
Value: 16000
|
| 25 |
+
FrequencyResolution:
|
| 26 |
+
Type: Float
|
| 27 |
+
Value: 2.0
|
| 28 |
+
FrequencyCenter:
|
| 29 |
+
Description: Lowest frequency to extract.
|
| 30 |
+
Type: Float
|
| 31 |
+
Value: 80
|
| 32 |
+
TimeCenter:
|
| 33 |
+
Description: Highest frequency to extract (1/time_center).
|
| 34 |
+
Type: Float
|
| 35 |
+
Value: 0.001
|
| 36 |
+
Gamma:
|
| 37 |
+
Type: List
|
| 38 |
+
SubType: Float
|
| 39 |
+
Value: [0.24, 0.6, 1.0]
|
| 40 |
+
BinsPerOctave:
|
| 41 |
+
Description: Number of bins for each octave.
|
| 42 |
+
Type: Integer
|
| 43 |
+
Value: 48
|
| 44 |
+
Dataset:
|
| 45 |
+
Description: Settings of datasets.
|
| 46 |
+
Settings:
|
| 47 |
+
SavePath:
|
| 48 |
+
Description: Path for storing the downloaded datasets.
|
| 49 |
+
Type: String
|
| 50 |
+
Value: ./
|
| 51 |
+
FeatureSavePath:
|
| 52 |
+
Description: Path for storing the extracted feature. Default to the path under the dataset folder.
|
| 53 |
+
Type: String
|
| 54 |
+
Value: +
|
| 55 |
+
Model:
|
| 56 |
+
Description: Default settings of training / testing the model.
|
| 57 |
+
Settings:
|
| 58 |
+
SavePrefix:
|
| 59 |
+
Description: Prefix of the trained model's name to be saved.
|
| 60 |
+
Type: String
|
| 61 |
+
Value: vocal
|
| 62 |
+
SavePath:
|
| 63 |
+
Description: Path to save the trained model.
|
| 64 |
+
Type: String
|
| 65 |
+
Value: ./checkpoints/vocal
|
| 66 |
+
MinKernelSize:
|
| 67 |
+
Description: Minimum kernel size of convolution layers in each pyramid block.
|
| 68 |
+
Type: Integer
|
| 69 |
+
Value: 16
|
| 70 |
+
Depth:
|
| 71 |
+
Description: Total number of pyramid blocks will be -> (Depth - 2) / 2 .
|
| 72 |
+
Type: Integer
|
| 73 |
+
Value: 110
|
| 74 |
+
Alpha:
|
| 75 |
+
Type: Integer
|
| 76 |
+
Value: 270
|
| 77 |
+
ShakeDrop:
|
| 78 |
+
Description: Whether to leverage Shake Drop normalization during back propagation.
|
| 79 |
+
Type: Bool
|
| 80 |
+
Value: True
|
| 81 |
+
SemiLossWeight:
|
| 82 |
+
Description: Weighting factor of the semi-supervised loss. Supervised loss will not be affected by this parameter.
|
| 83 |
+
Type: Float
|
| 84 |
+
Value: 1.0
|
| 85 |
+
SemiXi:
|
| 86 |
+
Description: A small constant value for weighting the adversarial perturbation.
|
| 87 |
+
Type: Float
|
| 88 |
+
Value: 0.000001
|
| 89 |
+
SemiEpsilon:
|
| 90 |
+
Description: Weighting factor of the output adversarial perturbation.
|
| 91 |
+
Type: Float
|
| 92 |
+
Value: 8.0
|
| 93 |
+
SemiIterations:
|
| 94 |
+
Description: Number of iterations when generating the adversarial perturbation.
|
| 95 |
+
Type: Integer
|
| 96 |
+
Value: 2
|
| 97 |
+
Inference:
|
| 98 |
+
Description: Default settings when inferring notes.
|
| 99 |
+
Settings:
|
| 100 |
+
ContextLength:
|
| 101 |
+
Description: Length of context that will be used to find the peaks.
|
| 102 |
+
Type: Integer
|
| 103 |
+
Value: 2
|
| 104 |
+
Threshold:
|
| 105 |
+
Description: Threshold that will be applied to clip the predicted values to either 0 or 1.
|
| 106 |
+
Type: Float
|
| 107 |
+
Value: 0.5
|
| 108 |
+
MinDuration:
|
| 109 |
+
Description: Minimum required length of each note, in seconds.
|
| 110 |
+
Type: Float
|
| 111 |
+
Value: 0.1
|
| 112 |
+
PitchModel:
|
| 113 |
+
Description: The model for predicting the pitch contour. Defaults to the vocal-contour module. Could be a path or a mode name.
|
| 114 |
+
Type: String
|
| 115 |
+
Value: VocalContour
|
| 116 |
+
Training:
|
| 117 |
+
Description: Hyper parameters for training
|
| 118 |
+
Settings:
|
| 119 |
+
Epoch:
|
| 120 |
+
Description: Maximum number of epochs for training.
|
| 121 |
+
Type: Integer
|
| 122 |
+
Value: 10
|
| 123 |
+
Steps:
|
| 124 |
+
Description: Number of training steps for each epoch.
|
| 125 |
+
Type: Integer
|
| 126 |
+
Value: 1000
|
| 127 |
+
ValSteps:
|
| 128 |
+
Description: Number of validation steps after each training epoch.
|
| 129 |
+
Type: Integer
|
| 130 |
+
Value: 50
|
| 131 |
+
BatchSize:
|
| 132 |
+
Description: Batch size of each training step.
|
| 133 |
+
Type: Integer
|
| 134 |
+
Value: 64
|
| 135 |
+
ValBatchSize:
|
| 136 |
+
Description: Batch size of each validation step.
|
| 137 |
+
Type: Integer
|
| 138 |
+
Value: 64
|
| 139 |
+
EarlyStop:
|
| 140 |
+
Description: Terminate the training if the validation performance doesn't improve after n epochs.
|
| 141 |
+
Type: Integer
|
| 142 |
+
Value: 8
|
| 143 |
+
InitLearningRate:
|
| 144 |
+
Description: Initial learning rate.
|
| 145 |
+
Type: Float
|
| 146 |
+
Value: 0.0001
|
| 147 |
+
ContextLength:
|
| 148 |
+
Description: Context to be considered before and after current timestamp.
|
| 149 |
+
Type: Integer
|
| 150 |
+
Value: 9
|
omnizart/vocal/vocal_semi/saved_model.pb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec5296106686e602b7fa1fc0462911234c3203c5f553b59b99a0d34671466043
|
| 3 |
+
size 14281573
|
omnizart/vocal/vocal_semi/variables/variables.data-00000-of-00001
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c60c2e441adbe00f7c8c204a1b923e16bb35efa364ed76320bd70356496a9cc3
|
| 3 |
+
size 114617623
|
omnizart/vocal/vocal_semi/variables/variables.index
ADDED
|
Binary file (45.8 kB). View file
|
|
|