Spaces:

ameythakur
/

Deepfake-Audio

Running

App Files Files Community

Deepfake-Audio / Source Code /encoder /config.py

ameythakur

Deepfake-Audio

1d8403e verified about 2 months ago

raw

history blame contribute delete

2.63 kB

	# ==================================================================================================
	# DEEPFAKE AUDIO - encoder/config.py (Dataset Manifest & Corpora Configuration)
	# ==================================================================================================
	#
	# 📝 DESCRIPTION
	# This module acts as the centralized registry for all speech datasets supported
	# by the Speaker Encoder. It defines the directory structures for LibriSpeech,
	# LibriTTS, VoxCeleb, and other major open-source corpora. These configurations
	# guide the preprocessing scripts in discovering and categorizing audio samples
	# for training and validation.
	#
	# 👤 AUTHORS
	# - Amey Thakur (https://github.com/Amey-Thakur)
	# - Mega Satish (https://github.com/msatmod)
	#
	# 🤝🏻 CREDITS
	# Original Real-Time Voice Cloning methodology by CorentinJ
	# Repository: https://github.com/CorentinJ/Real-Time-Voice-Cloning
	#
	# 🔗 PROJECT LINKS
	# Repository: https://github.com/Amey-Thakur/DEEPFAKE-AUDIO
	# Video Demo: https://youtu.be/i3wnBcbHDbs
	# Research: https://github.com/Amey-Thakur/DEEPFAKE-AUDIO/blob/main/DEEPFAKE-AUDIO.ipynb
	#
	# 📜 LICENSE
	# Released under the MIT License
	# Release Date: 2021-02-06
	# ==================================================================================================

	# --- LIBRISPEECH MANIFEST ---
	librispeech_datasets = {
	"train": {
	"clean": ["LibriSpeech/train-clean-100", "LibriSpeech/train-clean-360"],
	"other": ["LibriSpeech/train-other-500"]
	},
	"test": {
	"clean": ["LibriSpeech/test-clean"],
	"other": ["LibriSpeech/test-other"]
	},
	"dev": {
	"clean": ["LibriSpeech/dev-clean"],
	"other": ["LibriSpeech/dev-other"]
	},
	}

	# --- LIBRITTS MANIFEST ---
	libritts_datasets = {
	"train": {
	"clean": ["LibriTTS/train-clean-100", "LibriTTS/train-clean-360"],
	"other": ["LibriTTS/train-other-500"]
	},
	"test": {
	"clean": ["LibriTTS/test-clean"],
	"other": ["LibriTTS/test-other"]
	},
	"dev": {
	"clean": ["LibriTTS/dev-clean"],
	"other": ["LibriTTS/dev-other"]
	},
	}

	# --- VOXCELEB MANIFEST (SPEAKER RECOGNITION) ---
	voxceleb_datasets = {
	"voxceleb1" : {
	"train": ["VoxCeleb1/wav"],
	"test": ["VoxCeleb1/test_wav"]
	},
	"voxceleb2" : {
	"train": ["VoxCeleb2/dev/aac"],
	"test": ["VoxCeleb2/test_wav"]
	}
	}

	# --- MISCELLANEOUS CORPORA ---
	other_datasets = [
	"LJSpeech-1.1",
	"VCTK-Corpus/wav48",
	]

	# --- LINGUISTIC CATEGORIZATION ---
	anglophone_nationalites = ["australia", "canada", "ireland", "uk", "usa"]