Spaces:
Running
Running
File size: 2,632 Bytes
# ==================================================================================================
# DEEPFAKE AUDIO - encoder/config.py (Dataset Manifest & Corpora Configuration)
# ==================================================================================================
#
# DESCRIPTION
# This module acts as the centralized registry for all speech datasets supported
# by the Speaker Encoder. It defines the directory structures for LibriSpeech,
# LibriTTS, VoxCeleb, and other major open-source corpora. These configurations
# guide the preprocessing scripts in discovering and categorizing audio samples
# for training and validation.
#
# AUTHORS
# - Amey Thakur (https://github.com/Amey-Thakur)
# - Mega Satish (https://github.com/msatmod)
#
# CREDITS
# Original Real-Time Voice Cloning methodology by CorentinJ
# Repository: https://github.com/CorentinJ/Real-Time-Voice-Cloning
#
# PROJECT LINKS
# Repository: https://github.com/Amey-Thakur/DEEPFAKE-AUDIO
# Video Demo: https://youtu.be/i3wnBcbHDbs
# Research: https://github.com/Amey-Thakur/DEEPFAKE-AUDIO/blob/main/DEEPFAKE-AUDIO.ipynb
#
# LICENSE
# Released under the MIT License
# Release Date: 2021-02-06
# ==================================================================================================
# --- LIBRISPEECH MANIFEST ---
# Two-level lookup table for LibriSpeech:
#   split ("train" / "test" / "dev") -> subset ("clean" / "other") -> list of
#   directory paths.
# NOTE(review): the paths are relative; presumably they are resolved against a
# datasets root by the preprocessing code -- confirm against the caller.
librispeech_datasets = dict(
    train=dict(
        clean=["LibriSpeech/train-clean-100", "LibriSpeech/train-clean-360"],
        other=["LibriSpeech/train-other-500"],
    ),
    test=dict(
        clean=["LibriSpeech/test-clean"],
        other=["LibriSpeech/test-other"],
    ),
    dev=dict(
        clean=["LibriSpeech/dev-clean"],
        other=["LibriSpeech/dev-other"],
    ),
)
# --- LIBRITTS MANIFEST ---
# Two-level lookup table for LibriTTS:
#   split ("train" / "test" / "dev") -> subset ("clean" / "other") -> list of
#   directory paths.
# NOTE(review): the paths are relative; presumably they are resolved against a
# datasets root by the preprocessing code -- confirm against the caller.
libritts_datasets = dict(
    train=dict(
        clean=["LibriTTS/train-clean-100", "LibriTTS/train-clean-360"],
        other=["LibriTTS/train-other-500"],
    ),
    test=dict(
        clean=["LibriTTS/test-clean"],
        other=["LibriTTS/test-other"],
    ),
    dev=dict(
        clean=["LibriTTS/dev-clean"],
        other=["LibriTTS/dev-other"],
    ),
)
# --- VOXCELEB MANIFEST (SPEAKER RECOGNITION) ---
# Two-level lookup table for VoxCeleb:
#   corpus ("voxceleb1" / "voxceleb2") -> split ("train" / "test") -> list of
#   directory paths.
# NOTE(review): the paths are relative; presumably they are resolved against a
# datasets root by the preprocessing code -- confirm against the caller.
voxceleb_datasets = dict(
    voxceleb1=dict(
        train=["VoxCeleb1/wav"],
        test=["VoxCeleb1/test_wav"],
    ),
    voxceleb2=dict(
        train=["VoxCeleb2/dev/aac"],
        test=["VoxCeleb2/test_wav"],
    ),
)
# --- MISCELLANEOUS CORPORA ---
# Flat list of additional corpus directories that do not follow the
# split/subset layout used by the mappings for the other corpora.
other_datasets = ["LJSpeech-1.1", "VCTK-Corpus/wav48"]
# --- LINGUISTIC CATEGORIZATION ---
# Lowercase nationality labels treated as anglophone.
# NOTE(review): the identifier is spelled "nationalites" (sic); it is kept
# as-is because it is this module's public name and other modules presumably
# import it under this spelling -- confirm before renaming.
anglophone_nationalites = [
    "australia",
    "canada",
    "ireland",
    "uk",
    "usa",
]
|