File size: 1,291 Bytes
c7f3ffb
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2566adf
c7f3ffb
 
 
 
 
 
 
2566adf
 
c7f3ffb
 
 
 
 
 
 
 
2566adf
c7f3ffb
 
 
 
 
 
 
2566adf
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
#!/bin/bash
# Runs `python -m preprocess.pipeline` on the example audio files, from the
# project root.

# Resolve this script's real location; the parent of its directory is used as
# the project root.
script_dir=$(dirname "$(realpath "$0")")
root_dir=$(dirname "$script_dir")

# Quoted so a checkout path containing spaces or glob characters still works.
# A bare `exit` propagates cd's non-zero status.
cd "$root_dir" || exit

# Prepend the project root to PYTHONPATH. The ':' separator is only emitted
# when PYTHONPATH already has a value, so no trailing empty entry is created.
export PYTHONPATH="$root_dir${PYTHONPATH:+:$PYTHONPATH}"

# Value passed to the pipeline's --device option by the runs below.
device=cuda


####### Run Prompt Annotation #######
# Settings for the prompt audio; edit these to point at your own file.
audio_path=example/audio/zh_prompt.mp3
save_dir=example/transcriptions/zh_prompt
language=Mandarin
vocal_sep=False
max_merge_duration=30000
midi_transcribe=True    # Whether to transcribe vocal midi, set True for singing voice synthesis, False for singing voice conversion

# Build the argument list as an array with every expansion quoted, so values
# containing spaces or glob characters (or an empty value) are passed as
# exactly one argument each. `device` is set earlier in this script.
prompt_args=(
    --audio_path "$audio_path"
    --save_dir "$save_dir"
    --language "$language"
    --device "$device"
    --vocal_sep "$vocal_sep"
    --max_merge_duration "$max_merge_duration"
    --midi_transcribe "$midi_transcribe"
)

python -m preprocess.pipeline "${prompt_args[@]}"


####### Run Target Annotation #######
# Settings for the target audio; edit these to point at your own file.
audio_path=example/audio/music.mp3
save_dir=example/transcriptions/music
language=Mandarin
vocal_sep=True
max_merge_duration=60000
midi_transcribe=True    # Whether to transcribe vocal midi, set True for singing voice synthesis, False for singing voice conversion

# Build the argument list as an array with every expansion quoted, so values
# containing spaces or glob characters (or an empty value) are passed as
# exactly one argument each. `device` is set earlier in this script.
target_args=(
    --audio_path "$audio_path"
    --save_dir "$save_dir"
    --language "$language"
    --device "$device"
    --vocal_sep "$vocal_sep"
    --max_merge_duration "$max_merge_duration"
    --midi_transcribe "$midi_transcribe"
)

python -m preprocess.pipeline "${target_args[@]}"