| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| |
|
| | import argparse |
| | import random |
| |
|
| | from nemo.collections.asr.parts.utils.manifest_utils import create_manifest |
| |
|
# Seed Python's module-level RNG with a fixed value at import time.
# NOTE(review): nothing in this file draws random numbers directly; presumably
# this keeps any use of the global `random` state downstream reproducible — confirm.
random.seed(42)
| |
|
"""
This script creates a manifest file for speaker diarization inference.
It is useful when you have a list of audio files and, optionally, RTTM and UEM files for evaluation.

Note: make sure the basename of each audio file is unique and that each RTTM file has the corresponding basename for mapping.
"""
| |
|
| |
|
def main(
    wav_path, text_path=None, rttm_path=None, uem_path=None, ctm_path=None, manifest_filepath=None, add_duration=False
):
    """Create a manifest by delegating to ``create_manifest``.

    This is a thin wrapper: it performs no processing of its own and simply
    forwards every argument to ``create_manifest``.

    Args:
        wav_path: forwarded as the first positional argument (the CLI passes
            the value of ``--paths2audio_files`` here).
        text_path: forwarded as ``text_path`` (CLI: ``--paths2txt_files``).
        rttm_path: forwarded as ``rttm_path`` (CLI: ``--paths2rttm_files``).
        uem_path: forwarded as ``uem_path`` (CLI: ``--paths2uem_files``).
        ctm_path: forwarded as ``ctm_path`` (CLI: ``--paths2ctm_files``).
        manifest_filepath: forwarded as the second positional argument
            (CLI: ``--manifest_filepath``, the output manifest path).
        add_duration: forwarded as ``add_duration`` (CLI: ``--add_duration``).
    """
    # Everything except the audio list and the output path travels by keyword.
    optional_inputs = {
        "text_path": text_path,
        "rttm_path": rttm_path,
        "uem_path": uem_path,
        "ctm_path": ctm_path,
        "add_duration": add_duration,
    }
    create_manifest(wav_path, manifest_filepath, **optional_inputs)
| |
|
| |
|
if __name__ == "__main__":
    # Command-line entry point: parse the file-list paths and hand them to main().
    arg_parser = argparse.ArgumentParser()
    arg_parser.add_argument(
        "--paths2audio_files", type=str, required=True, help="path to text file containing list of audio files"
    )

    # Optional inputs; registered in this order so the --help listing is unchanged.
    optional_path_flags = (
        ("--paths2txt_files", "path to text file containing list of transcription files"),
        ("--paths2rttm_files", "path to text file containing list of rttm files"),
        ("--paths2uem_files", "path to uem files"),
        ("--paths2ctm_files", "path to ctm files"),
    )
    for flag, description in optional_path_flags:
        arg_parser.add_argument(flag, help=description, type=str)

    arg_parser.add_argument("--manifest_filepath", type=str, required=True, help="path to output manifest file")
    arg_parser.add_argument(
        "--add_duration", action="store_true", help="add duration of audio files to output manifest files."
    )
    cli = arg_parser.parse_args()

    main(
        wav_path=cli.paths2audio_files,
        text_path=cli.paths2txt_files,
        rttm_path=cli.paths2rttm_files,
        uem_path=cli.paths2uem_files,
        ctm_path=cli.paths2ctm_files,
        manifest_filepath=cli.manifest_filepath,
        add_duration=cli.add_duration,
    )
| |
|