| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| import argparse |
|
|
| from nemo.collections.audio.data.audio_to_audio_lhotse import convert_manifest_nemo_to_lhotse |
|
|
|
|
| def parse_args(): |
| parser = argparse.ArgumentParser( |
| description="Convert an audio-to-audio manifest from NeMo format to Lhotse format. " |
| "This step enables the use of Lhotse datasets for audio-to-audio processing. " |
| ) |
| parser.add_argument("input", help='Path to the input NeMo manifest.') |
| parser.add_argument( |
| "output", help="Path where we'll write the output Lhotse manifest (supported extensions: .jsonl.gz and .jsonl)" |
| ) |
| parser.add_argument( |
| "-i", |
| "--input_key", |
| default="audio_filepath", |
| help="Key of the input recording, mapped to Lhotse's 'Cut.recording'.", |
| ) |
| parser.add_argument( |
| "-t", |
| "--target_key", |
| default="target_filepath", |
| help="Key of the target recording, mapped to Lhotse's 'Cut.target_recording'.", |
| ) |
| parser.add_argument( |
| "-r", |
| "--reference_key", |
| default="reference_filepath", |
| help="Key of the reference recording, mapped to Lhotse's 'Cut.reference_recording'.", |
| ) |
| parser.add_argument( |
| "-e", |
| "--embedding_key", |
| default="embedding_filepath", |
| help="Key of the embedding, mapped to Lhotse's 'Cut.embedding_vector'.", |
| ) |
| parser.add_argument( |
| "-a", |
| "--force_absolute_paths", |
| action='store_true', |
| default=False, |
| help="Force absolute paths in the generated manifests.", |
| ) |
| return parser.parse_args() |
|
|
|
|
| def main(): |
| args = parse_args() |
| convert_manifest_nemo_to_lhotse( |
| input_manifest=args.input, |
| output_manifest=args.output, |
| input_key=args.input_key, |
| target_key=args.target_key, |
| reference_key=args.reference_key, |
| embedding_key=args.embedding_key, |
| force_absolute_paths=args.force_absolute_paths, |
| ) |
|
|
|
|
| if __name__ == "__main__": |
| main() |
|
|