Manage files into transcribe.py
Browse files- transcribe.py +19 -5
transcribe.py
CHANGED
|
@@ -1,9 +1,7 @@
|
|
| 1 |
import os
|
| 2 |
import argparse
|
| 3 |
|
| 4 |
-
def main(args):
|
| 5 |
-
audio_file = args.input
|
| 6 |
-
language = args.language
|
| 7 |
output_folder = "transcriptions"
|
| 8 |
|
| 9 |
# Transcribe audio file
|
|
@@ -21,7 +19,23 @@ def main(args):
|
|
| 21 |
|
| 22 |
if __name__ == "__main__":
|
| 23 |
parser = argparse.ArgumentParser(description='Transcribe audio files')
|
| 24 |
-
parser.add_argument('
|
| 25 |
parser.add_argument('language', help='Language of the audio file')
|
|
|
|
| 26 |
args = parser.parse_args()
|
| 27 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
import os
|
| 2 |
import argparse
|
| 3 |
|
| 4 |
+
def transcribe(audio_file, language):
|
|
|
|
|
|
|
| 5 |
output_folder = "transcriptions"
|
| 6 |
|
| 7 |
# Transcribe audio file
|
|
|
|
| 19 |
|
| 20 |
if __name__ == "__main__":
|
| 21 |
parser = argparse.ArgumentParser(description='Transcribe audio files')
|
| 22 |
+
parser.add_argument('input_files', help='Input audio files')
|
| 23 |
parser.add_argument('language', help='Language of the audio file')
|
| 24 |
+
parser.add_argument('speakers_file', help='File with the number of speakers')
|
| 25 |
args = parser.parse_args()
|
| 26 |
+
|
| 27 |
+
vocals_folder = "vocals"
|
| 28 |
+
extension = "wav"
|
| 29 |
+
|
| 30 |
+
with open(args.speakers_file, 'r') as f:
|
| 31 |
+
speakers = f.read().splitlines()
|
| 32 |
+
speakers = int(speakers[0])
|
| 33 |
+
|
| 34 |
+
with open(args.input_files, 'r') as f:
|
| 35 |
+
inputs = f.read().splitlines()
|
| 36 |
+
for input in inputs:
|
| 37 |
+
input, _ = input.split('.')
|
| 38 |
+
_, input_name = input.split('/')
|
| 39 |
+
for i in range(speakers):
|
| 40 |
+
file = f'{vocals_folder}/{input_name}_speaker{i:003d}.{extension}'
|
| 41 |
+
transcribe(file, args.language)
|