| |
| """Easy GUI (for RVC v2, with crepe) (with improved downloader) |
| |
| Automatically generated by Colaboratory. |
| |
| Original file is located at |
| https://colab.research.google.com/drive/1Gj6UTf2gicndUW_tVheVhTXIIYpFTYc7 |
| |
| ### RVC GENERAL COVER GUIDE: |
| https://docs.google.com/document/d/13_l1bd1Osgz7qlAZn-zhklCbHpVRk6bYOuAuB78qmsE/edit?usp=sharing |
| |
| ### RVC VOICE TRAINING GUIDE: |
| https://docs.google.com/document/d/13ebnzmeEBc6uzYCMt-QVFQk-whVrK4zw8k7_Lw3Bv_A/edit?usp=sharing |
| |
| ##**EDIT 6/17:** Easy GUI interface finally updated by Rejekts, the original colab author! |
| ####Major thanks and shoutout to him! Advanced settings have been added to a separate menu. If this new interface gives you troubles, simply enable the old interface again, or ping me @kalomaze in the AI HUB Discord. |
| |
| Keep in mind 'mangio-crepe' is superior to the other 'crepe' in both training and inference. The hop size won't be properly configurable otherwise. |
| |
| ##Step 1. Install (it will take 30-45 seconds) |
| |
| [](https://colab.research.google.com/github/liujing04/Retrieval-based-Voice-Conversion-WebUI/blob/main/Retrieval_based_Voice_Conversion_WebUI.ipynb) |
| If you want to open the ORIGINAL Colab go here! |
| """ |
|
|
| |
| !nvidia-smi |
|
|
| |
| |
| import os |
| import csv |
| import shutil |
| import tarfile |
| import subprocess |
| from pathlib import Path |
| from datetime import datetime |
|
|
| |
| ForceUpdateDependencies = False |
| |
| ForceTemporaryStorage = True |
|
|
| |
| if not ForceTemporaryStorage: |
| from google.colab import drive |
|
|
| if not os.path.exists('/content/drive'): |
| drive.mount('/content/drive') |
| else: |
| print('Drive is already mounted. Proceeding...') |
|
|
| |
| def install_packages(): |
| packages = ['build-essential', 'python3-dev', 'ffmpeg', 'aria2'] |
| pip_packages = ['pip', 'setuptools', 'wheel', 'httpx==0.23.0', 'faiss-gpu', 'fairseq', 'gradio==3.34.0', |
| 'ffmpeg', 'ffmpeg-python', 'praat-parselmouth', 'pyworld', 'numpy==1.23.5', |
| 'numba==0.56.4', 'librosa==0.9.2', 'mega.py', 'gdown', 'onnxruntime', 'pyngrok==4.1.12'] |
|
|
| print("Updating and installing system packages...") |
| for package in packages: |
| print(f"Installing {package}...") |
| subprocess.check_call(['apt-get', 'install', '-qq', '-y', package]) |
|
|
| print("Updating and installing pip packages...") |
| subprocess.check_call(['pip', 'install', '--upgrade'] + pip_packages) |
|
|
| print('Packages up to date.') |
|
|
| |
| def scan_and_write(base_path, output_file): |
| with open(output_file, 'w', newline='') as f: |
| writer = csv.writer(f) |
| for dirpath, dirs, files in os.walk(base_path): |
| for filename in files: |
| fname = os.path.join(dirpath, filename) |
| try: |
| mtime = os.path.getmtime(fname) |
| writer.writerow([fname, mtime]) |
| except Exception as e: |
| print(f'Skipping irrelevant nonexistent file {fname}: {str(e)}') |
| print(f'Finished recording filesystem timestamps to {output_file}.') |
|
|
| |
| def compare_files(old_file, new_file): |
| old_files = {} |
| new_files = {} |
|
|
| with open(old_file, 'r') as f: |
| reader = csv.reader(f) |
| old_files = {rows[0]:rows[1] for rows in reader} |
|
|
| with open(new_file, 'r') as f: |
| reader = csv.reader(f) |
| new_files = {rows[0]:rows[1] for rows in reader} |
|
|
| removed_files = old_files.keys() - new_files.keys() |
| added_files = new_files.keys() - old_files.keys() |
| unchanged_files = old_files.keys() & new_files.keys() |
|
|
| changed_files = {f for f in unchanged_files if old_files[f] != new_files[f]} |
|
|
| for file in removed_files: |
| print(f'File has been removed: {file}') |
|
|
| for file in changed_files: |
| print(f'File has been updated: {file}') |
|
|
| return list(added_files) + list(changed_files) |
|
|
| |
| if ForceTemporaryStorage: |
| file_path = '/content/CachedRVC.tar.gz' |
| else: |
| file_path = '/content/drive/MyDrive/RVC_Cached/CachedRVC.tar.gz' |
|
|
| content_file_path = '/content/CachedRVC.tar.gz' |
| extract_path = '/' |
|
|
| !pip install -q gTTS |
| !pip install -q elevenlabs |
|
|
| def extract_wav2lip_tar_files(): |
| !wget https://github.com/777gt/EVC/raw/main/wav2lip-HD.tar.gz |
| !wget https://github.com/777gt/EVC/raw/main/wav2lip-cache.tar.gz |
|
|
| with tarfile.open('/content/wav2lip-cache.tar.gz', 'r:gz') as tar: |
| for member in tar.getmembers(): |
| target_path = os.path.join('/', member.name) |
| try: |
| tar.extract(member, '/') |
| except: |
| pass |
|
|
| with tarfile.open('/content/wav2lip-HD.tar.gz') as tar: |
| tar.extractall('/content') |
|
|
| extract_wav2lip_tar_files() |
|
|
| if not os.path.exists(file_path): |
| folder_path = os.path.dirname(file_path) |
| os.makedirs(folder_path, exist_ok=True) |
| print('No cached dependency install found. Attempting to download GitHub backup..') |
|
|
| try: |
| download_url = "https://github.com/kalomaze/QuickMangioFixes/releases/download/release3/CachedRVC.tar.gz" |
| !wget -O $file_path $download_url |
| print('Download completed successfully!') |
| except Exception as e: |
| print('Download failed:', str(e)) |
|
|
| |
| if os.path.exists(file_path): |
| os.remove(file_path) |
| print('Failed download file deleted. Continuing manual backup..') |
|
|
| if Path(file_path).exists(): |
| if ForceTemporaryStorage: |
| print('Finished downloading CachedRVC.tar.gz.') |
| else: |
| print('CachedRVC.tar.gz found on Google Drive. Proceeding to copy and extract...') |
|
|
| |
| if ForceTemporaryStorage: |
| pass |
| else: |
| shutil.copy(file_path, content_file_path) |
|
|
| print('Beginning backup copy operation...') |
|
|
| with tarfile.open(content_file_path, 'r:gz') as tar: |
| for member in tar.getmembers(): |
| target_path = os.path.join(extract_path, member.name) |
| try: |
| tar.extract(member, extract_path) |
| except Exception as e: |
| print('Failed to extract a file (this isn\'t normal)... forcing an update to compensate') |
| ForceUpdateDependencies = True |
| print(f'Extraction of {content_file_path} to {extract_path} completed.') |
|
|
| if ForceUpdateDependencies: |
| install_packages() |
| ForceUpdateDependencies = False |
| else: |
| print('CachedRVC.tar.gz not found. Proceeding to create an index of all current files...') |
| scan_and_write('/usr/', '/content/usr_files.csv') |
|
|
| install_packages() |
|
|
| scan_and_write('/usr/', '/content/usr_files_new.csv') |
| changed_files = compare_files('/content/usr_files.csv', '/content/usr_files_new.csv') |
|
|
| with tarfile.open('/content/CachedRVC.tar.gz', 'w:gz') as new_tar: |
| for file in changed_files: |
| new_tar.add(file) |
| print(f'Added to tar: {file}') |
|
|
| os.makedirs('/content/drive/MyDrive/RVC_Cached', exist_ok=True) |
| shutil.copy('/content/CachedRVC.tar.gz', '/content/drive/MyDrive/RVC_Cached/CachedRVC.tar.gz') |
| print('Updated CachedRVC.tar.gz copied to Google Drive.') |
| print('Dependencies fully up to date; future runs should be faster.') |
|
|
| |
| import os |
|
|
| |
| os.chdir('/content/') |
|
|
| |
| def edit_file(file_path): |
| temp_file_path = "/tmp/temp_file.py" |
| changes_made = False |
| with open(file_path, "r") as file, open(temp_file_path, "w") as temp_file: |
| previous_line = "" |
| for line in file: |
| new_line = line.replace("value=160", "value=128") |
| if new_line != line: |
| print("Replaced 'value=160' with 'value=128'") |
| changes_made = True |
| line = new_line |
|
|
| new_line = line.replace("crepe hop length: 160", "crepe hop length: 128") |
| if new_line != line: |
| print("Replaced 'crepe hop length: 160' with 'crepe hop length: 128'") |
| changes_made = True |
| line = new_line |
|
|
| new_line = line.replace("value=0.88", "value=0.75") |
| if new_line != line: |
| print("Replaced 'value=0.88' with 'value=0.75'") |
| changes_made = True |
| line = new_line |
|
|
| if "label=i18n(\"输入源音量包络替换输出音量包络融合比例,越靠近1越使用输出包络\")" in previous_line and "value=1," in line: |
| new_line = line.replace("value=1,", "value=0.25,") |
| if new_line != line: |
| print("Replaced 'value=1,' with 'value=0.25,' based on the condition") |
| changes_made = True |
| line = new_line |
|
|
| if 'choices=["pm", "harvest", "dio", "crepe", "crepe-tiny", "mangio-crepe", "mangio-crepe-tiny"], # Fork Feature. Add Crepe-Tiny' in previous_line: |
| if 'value="pm",' in line: |
| new_line = line.replace('value="pm",', 'value="mangio-crepe",') |
| if new_line != line: |
| print("Replaced 'value=\"pm\",' with 'value=\"mangio-crepe\",' based on the condition") |
| changes_made = True |
| line = new_line |
|
|
| temp_file.write(line) |
| previous_line = line |
|
|
| |
| import shutil |
| shutil.move(temp_file_path, file_path) |
|
|
| if changes_made: |
| print("Changes made and file saved successfully.") |
| else: |
| print("No changes were needed.") |
|
|
| repo_path = '/content/Retrieval-based-Voice-Conversion-WebUI' |
| if not os.path.exists(repo_path): |
| |
| !git clone https://github.com/Mangio621/Mangio-RVC-Fork.git |
| os.chdir('/content/Mangio-RVC-Fork') |
| !wget https://github.com/777gt/EasyGUI-RVC-Fork/raw/main/EasierGUI.py |
| os.chdir('/content/') |
| !mv /content/Mangio-RVC-Fork /content/Retrieval-based-Voice-Conversion-WebUI |
| edit_file("/content/Retrieval-based-Voice-Conversion-WebUI/infer-web.py") |
| |
| !mkdir -p /content/Retrieval-based-Voice-Conversion-WebUI/audios |
| !wget https://github.com/777gt/EVC/raw/main/someguy.mp3 -O /content/Retrieval-based-Voice-Conversion-WebUI/audios/someguy.mp3 |
| !wget https://github.com/777gt/EVC/raw/main/somegirl.mp3 -O /content/Retrieval-based-Voice-Conversion-WebUI/audios/somegirl.mp3 |
| |
| !rm -rf /content/Retrieval-based-Voice-Conversion-WebUI/il8n/en_US.json |
| !wget https://github.com/kalomaze/QuickMangioFixes/releases/download/release3/en_US.json -P /content/Retrieval-based-Voice-Conversion-WebUI/il8n/ |
| else: |
| print(f"The repository already exists at {repo_path}. Skipping cloning.") |
|
|
| |
| !mkdir -p /content/Retrieval-based-Voice-Conversion-WebUI/stats/ |
| !wget -q https://cdn.discordapp.com/attachments/945486970883285045/1114717554481569802/peppy-generator-388800-07722f17a188.json -O /content/Retrieval-based-Voice-Conversion-WebUI/stats/peppy-generator-388800-07722f17a188.json |
|
|
| |
| !rm -rf /Retrieval-based-Voice-Conversion-WebUI/torchcrepe |
|
|
| |
| !git clone https://github.com/maxrmorrison/torchcrepe.git |
| !mv torchcrepe/torchcrepe Retrieval-based-Voice-Conversion-WebUI/ |
| !rm -rf torchcrepe |
|
|
| |
| os.chdir('/content/Retrieval-based-Voice-Conversion-WebUI') |
| !mkdir -p pretrained uvr5_weights |
|
|
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| |
| |
|
|
| !aria2c --console-log-level=error -c -x 16 -s 16 -k 1M https://huggingface.co/lj1995/VoiceConversionWebUI/resolve/main/hubert_base.pt -d /content/Retrieval-based-Voice-Conversion-WebUI -o hubert_base.pt |
|
|
| |
| |
| |
|
|
| """##Models List: |
| ###You can download from **any** link you have as long as it's RVC. (Mega, Drive, etc.) |
| |
| Biggest organized voice collection at #voice-models in https://discord.gg/aihub |
| |
| Model archive spreadsheet, sorted by popularity: https://docs.google.com/spreadsheets/d/1tAUaQrEHYgRsm1Lvrnj14HFHDwJWl0Bd9x0QePewNco/ |
| |
| Backup model archive (outdated): https://huggingface.co/QuickWick/Music-AI-Voices/tree/main |
| """ |
|
|
| |
| |
|
|
| from mega import Mega |
| import os |
| import shutil |
| from urllib.parse import urlparse, parse_qs |
| import urllib.parse |
| from google.oauth2.service_account import Credentials |
| import gspread |
| import pandas as pd |
| from tqdm import tqdm |
| from bs4 import BeautifulSoup |
| import requests |
| import hashlib |
|
|
| def calculate_md5(file_path): |
| hash_md5 = hashlib.md5() |
| with open(file_path, "rb") as f: |
| for chunk in iter(lambda: f.read(4096), b""): |
| hash_md5.update(chunk) |
| return hash_md5.hexdigest() |
|
|
| |
| scope = ['https://www.googleapis.com/auth/spreadsheets', |
| 'https://www.googleapis.com/auth/drive.file', |
| 'https://www.googleapis.com/auth/drive'] |
|
|
| config_path = '/content/Retrieval-based-Voice-Conversion-WebUI/stats/peppy-generator-388800-07722f17a188.json' |
|
|
| if os.path.exists(config_path): |
| |
| creds = Credentials.from_service_account_file(config_path, scopes=scope) |
| client = gspread.authorize(creds) |
| else: |
| |
| print("Sheet credential file missing.") |
|
|
| |
| book = client.open("RVC Model Archive Sheet") |
| sheet = book.get_worksheet(3) |
|
|
| def update_sheet(url, filename, filesize, md5_hash, index_version): |
| data = sheet.get_all_records() |
| df = pd.DataFrame(data) |
|
|
| if md5_hash in df['MD5 Hash'].values: |
| idx = df[df['MD5 Hash'] == md5_hash].index[0] |
|
|
| |
| df.loc[idx, 'Download Counter'] = int(df.loc[idx, 'Download Counter']) + 1 |
| sheet.update_cell(idx+2, df.columns.get_loc('Download Counter') + 1, int(df.loc[idx, 'Download Counter'])) |
|
|
| |
| alt_url_cols = [col for col in df.columns if 'Alt URL' in col] |
| alt_url_values = [df.loc[idx, col_name] for col_name in alt_url_cols] |
|
|
| |
| if url not in alt_url_values and url != df.loc[idx, 'URL']: |
| for col_name in alt_url_cols: |
| if df.loc[idx, col_name] == '': |
| df.loc[idx, col_name] = url |
| sheet.update_cell(idx+2, df.columns.get_loc(col_name) + 1, url) |
| break |
| else: |
| |
| new_row_dict = {'URL': url, 'Download Counter': 1, 'Filename': filename, |
| 'Filesize (.pth)': filesize, 'MD5 Hash': md5_hash, 'RVC Version': index_version} |
|
|
| alt_url_cols = [col for col in df.columns if 'Alt URL' in col] |
| for col in alt_url_cols: |
| new_row_dict[col] = '' |
|
|
| |
| new_row_dict = {key: str(value) if key not in ['Download Counter', 'Filesize (.pth)'] else value for key, value in new_row_dict.items()} |
|
|
| |
| ordered_row = [new_row_dict.get(col, '') for col in df.columns] |
| sheet.append_row(ordered_row, value_input_option='RAW') |
|
|
| condition1 = False |
| condition2 = False |
| already_downloaded = False |
|
|
| |
|
|
| !rm -rf /content/unzips/ |
| !rm -rf /content/zips/ |
| !mkdir /content/unzips |
| !mkdir /content/zips |
|
|
| def sanitize_directory(directory): |
| for filename in os.listdir(directory): |
| file_path = os.path.join(directory, filename) |
| if os.path.isfile(file_path): |
| if filename == ".DS_Store" or filename.startswith("._"): |
| os.remove(file_path) |
| elif os.path.isdir(file_path): |
| sanitize_directory(file_path) |
|
|
| url = 'https://huggingface.co/Flyleaf/EltonJohnModern/resolve/main/2019Elton.zip' |
| model_zip = urlparse(url).path.split('/')[-2] + '.zip' |
| model_zip_path = '/content/zips/' + model_zip |
|
|
| |
| private_model = False |
|
|
| if url != '': |
| MODEL = "" |
| !mkdir -p /content/Retrieval-based-Voice-Conversion-WebUI/logs/$MODEL |
| !mkdir -p /content/zips/ |
| !mkdir -p /content/Retrieval-based-Voice-Conversion-WebUI/weights/ |
|
|
| if "drive.google.com" in url: |
| !gdown $url --fuzzy -O "$model_zip_path" |
| elif "/blob/" in url: |
| url = url.replace("blob", "resolve") |
| print("Resolved URL:", url) |
| !wget "$url" -O "$model_zip_path" |
| elif "mega.nz" in url: |
| m = Mega() |
| print("Starting download from MEGA....") |
| m.download_url(url, '/content/zips') |
| elif "/tree/main" in url: |
| response = requests.get(url) |
| soup = BeautifulSoup(response.content, 'html.parser') |
| temp_url = '' |
| for link in soup.find_all('a', href=True): |
| if link['href'].endswith('.zip'): |
| temp_url = link['href'] |
| break |
| if temp_url: |
| url = temp_url |
| print("Updated URL:", url) |
| url = url.replace("blob", "resolve") |
| print("Resolved URL:", url) |
|
|
| if "huggingface.co" not in url: |
| url = "https://huggingface.co" + url |
|
|
| !wget "$url" -O "$model_zip_path" |
| else: |
| print("No .zip file found on the page.") |
| |
| else: |
| !wget "$url" -O "$model_zip_path" |
|
|
| for filename in os.listdir("/content/zips"): |
| if filename.endswith(".zip"): |
| zip_file = os.path.join("/content/zips", filename) |
| shutil.unpack_archive(zip_file, "/content/unzips", 'zip') |
|
|
| sanitize_directory("/content/unzips") |
|
|
| def find_pth_file(folder): |
| for root, dirs, files in os.walk(folder): |
| for file in files: |
| if file.endswith(".pth"): |
| file_name = os.path.splitext(file)[0] |
| if file_name.startswith("G_") or file_name.startswith("P_"): |
| config_file = os.path.join(root, "config.json") |
| if os.path.isfile(config_file): |
| print("Outdated .pth detected! This is not compatible with the RVC method. Find the RVC equivalent model!") |
| continue |
| file_path = os.path.join(root, file) |
| if os.path.getsize(file_path) > 100 * 1024 * 1024: |
| print("Skipping unusable training file:", file) |
| continue |
| return file_name |
| return None |
|
|
| MODEL = find_pth_file("/content/unzips") |
| if MODEL is not None: |
| print("Found .pth file:", MODEL + ".pth") |
| else: |
| print("Error: Could not find a valid .pth file within the extracted zip.") |
| print("If there's an error above this talking about 'Access denied', try one of the Alt URLs in the Google Sheets for this model.") |
| MODEL = "" |
| global condition3 |
| condition3 = True |
|
|
| index_path = "" |
|
|
| def find_version_number(index_path): |
| if condition2 and not condition1: |
| if file_size >= 55180000: |
| return 'RVC v2' |
| else: |
| return 'RVC v1' |
|
|
| filename = os.path.basename(index_path) |
|
|
| if filename.endswith("_v2.index"): |
| return 'RVC v2' |
| elif filename.endswith("_v1.index"): |
| return 'RVC v1' |
| else: |
| if file_size >= 55180000: |
| return 'RVC v2' |
| else: |
| return 'RVC v1' |
|
|
| if MODEL != "": |
| |
| for root, dirs, files in os.walk('/content/unzips'): |
| for file in files: |
| file_path = os.path.join(root, file) |
| if file.endswith(".index"): |
| print("Found index file:", file) |
| condition1 = True |
| logs_folder = os.path.join('/content/Retrieval-based-Voice-Conversion-WebUI/logs', MODEL) |
| os.makedirs(logs_folder, exist_ok=True) |
|
|
| |
| if file.endswith(".index"): |
| identical_index_path = os.path.join(logs_folder, file) |
| if os.path.exists(identical_index_path): |
| os.remove(identical_index_path) |
|
|
| shutil.move(file_path, logs_folder) |
| index_path = os.path.join(logs_folder, file) |
|
|
| elif "G_" not in file and "D_" not in file and file.endswith(".pth"): |
| destination_path = f'/content/Retrieval-based-Voice-Conversion-WebUI/weights/{MODEL}.pth' |
| if os.path.exists(destination_path): |
| print("You already downloaded this model. Re-importing anyways..") |
| already_downloaded = True |
| shutil.move(file_path, destination_path) |
| condition2 = True |
| if already_downloaded is False and os.path.exists(config_path): |
| file_size = os.path.getsize(destination_path) |
| md5_hash = calculate_md5(destination_path) |
| index_version = find_version_number(index_path) |
|
|
| if condition1 is False: |
| logs_folder = os.path.join('/content/Retrieval-based-Voice-Conversion-WebUI/logs', MODEL) |
| os.makedirs(logs_folder, exist_ok=True) |
| |
|
|
| if condition2 and not condition1: |
| print("Model partially imported! No .index file was found in the model download. The author may have forgotten to add the index file.") |
| if already_downloaded is False and os.path.exists(config_path) and not private_model: |
| update_sheet(url, MODEL, file_size, md5_hash, index_version) |
|
|
| elif condition1 and condition2: |
| print("Model successfully imported!") |
| if already_downloaded is False and os.path.exists(config_path) and not private_model: |
| update_sheet(url, MODEL, file_size, md5_hash, index_version) |
|
|
| elif condition3: |
| pass |
| else: |
| print("URL cannot be left empty. If you don't want to download a model now, just skip this step.") |
|
|
| !rm -r /content/unzips/ |
| !rm -r /content/zips/ |
|
|
| """#Step 3. Start the GUI, then open the public URL. It's gonna look like this: |
|  |
| """ |
|
|
| |
| |
|
|
| |
| |
| easy_gui = True |
|
|
| if easy_gui: |
| !python3 EasierGUI.py --colab --pycmd python3 |
| else: |
| !python3 infer-web.py --colab --pycmd python3 |
|
|
| """* For the original RVC GUI, visit: https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI |
| * If you need to train a model visit: https://colab.research.google.com/drive/1TU-kkQWVf-PLO_hSa2QCMZS1XF5xVHqs?usp=sharing |
| |
| #Other |
| """ |
|
|
| |
| |
| |
| from google.colab import files |
| from IPython.display import display, Javascript |
| import os |
| import shutil |
| import zipfile |
| import ipywidgets as widgets |
|
|
| |
| target_dir = '/content/Retrieval-based-Voice-Conversion-WebUI/audios/' |
| if not os.path.exists(target_dir): |
| os.makedirs(target_dir) |
|
|
| uploaded = files.upload() |
|
|
| for fn in uploaded.keys(): |
| |
| if fn.endswith('.zip'): |
| |
| zip_path = os.path.join(target_dir, fn) |
| with open(zip_path, 'wb') as f: |
| f.write(uploaded[fn]) |
|
|
| unzip_dir = os.path.join(target_dir, fn[:-4]) |
|
|
| |
| with zipfile.ZipFile(zip_path, 'r') as zip_ref: |
| zip_ref.extractall(unzip_dir) |
|
|
| |
| if os.path.exists(zip_path): |
| os.remove(zip_path) |
|
|
| print('Zip file "{name}" extracted and removed. Files are in: {folder}'.format(name=fn, folder=unzip_dir)) |
|
|
| |
| for extracted_file in os.listdir(unzip_dir): |
| extracted_file_path = os.path.join(unzip_dir, extracted_file) |
| extracted_file_length = os.path.getsize(extracted_file_path) |
|
|
| extracted_file_label = widgets.HTML( |
| value='Extracted file "{name}" with length {length} bytes'.format(name=extracted_file, length=extracted_file_length) |
| ) |
| display(extracted_file_label) |
|
|
| extracted_file_path_text = widgets.HTML( |
| value='File saved to: <a href="{}" target="_blank">{}</a>'.format(extracted_file_path, extracted_file_path) |
| ) |
|
|
| extracted_copy_button = widgets.Button(description='Copy') |
| extracted_copy_button_file_path = extracted_file_path |
|
|
| def copy_to_clipboard(b): |
| js_code = ''' |
| const el = document.createElement('textarea'); |
| el.value = "{path}"; |
| el.setAttribute('readonly', ''); |
| el.style.position = 'absolute'; |
| el.style.left = '-9999px'; |
| document.body.appendChild(el); |
| el.select(); |
| document.execCommand('copy'); |
| document.body.removeChild(el); |
| ''' |
| display(Javascript(js_code.format(path=extracted_copy_button_file_path))) |
|
|
| extracted_copy_button.on_click(copy_to_clipboard) |
| display(widgets.HBox([extracted_file_path_text, extracted_copy_button])) |
|
|
| continue |
|
|
| |
| |
| file_path = os.path.join(target_dir, fn) |
| with open(file_path, 'wb') as f: |
| f.write(uploaded[fn]) |
|
|
| file_length = len(uploaded[fn]) |
| file_label = widgets.HTML( |
| value='User uploaded file "{name}" with length {length} bytes'.format(name=fn, length=file_length) |
| ) |
| display(file_label) |
|
|
| |
| if fn.endswith('.pth') or fn.endswith('.index'): |
| warning_text = widgets.HTML( |
| value='<b style="color: red;">Warning:</b> You are uploading a model file in the wrong place. Please ensure it is uploaded to the correct location.' |
| ) |
| display(warning_text) |
|
|
| |
| file_path_text = widgets.HTML( |
| value='File saved to: <a href="{}" target="_blank">{}</a>'.format(file_path, file_path) |
| ) |
|
|
| copy_button = widgets.Button(description='Copy') |
| copy_button_file_path = file_path |
|
|
| def copy_to_clipboard(b): |
| js_code = ''' |
| const el = document.createElement('textarea'); |
| el.value = "{path}"; |
| el.setAttribute('readonly', ''); |
| el.style.position = 'absolute'; |
| el.style.left = '-9999px'; |
| document.body.appendChild(el); |
| el.select(); |
| document.execCommand('copy'); |
| document.body.removeChild(el); |
| ''' |
| display(Javascript(js_code.format(path=copy_button_file_path))) |
|
|
| copy_button.on_click(copy_to_clipboard) |
| display(widgets.HBox([file_path_text, copy_button])) |
|
|
| |
| for fn in uploaded.keys(): |
| if os.path.exists(os.path.join("/content/", fn)): |
| os.remove(os.path.join("/content/", fn)) |
|
|
| |
| |
| url = 'INSERTURLHERE' |
|
|
| import subprocess |
| import os |
| import shutil |
| from urllib.parse import urlparse, parse_qs |
| from google.colab import output |
| from google.colab import drive |
|
|
| mount_to_drive = True |
| mount_path = '/content/drive/MyDrive' |
|
|
| def mount(gdrive=False): |
| if gdrive: |
| if not os.path.exists("/content/drive/MyDrive"): |
| try: |
| drive.mount("/content/drive", force_remount=True) |
| except: |
| drive._mount("/content/drive", force_remount=True) |
| else: |
| pass |
|
|
| mount(mount_to_drive) |
|
|
| def check_package_installed(package_name): |
| command = f"pip show {package_name}" |
| result = subprocess.run(command.split(), stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) |
| return result.returncode == 0 |
|
|
| def install_package(package_name): |
| command = f"pip install {package_name} --quiet" |
| subprocess.run(command.split(), stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) |
|
|
| if not check_package_installed("mega.py"): |
| install_package("mega.py") |
|
|
| from mega import Mega |
| import os |
| import shutil |
| from urllib.parse import urlparse, parse_qs |
| import urllib.parse |
|
|
| !rm -rf /content/unzips/ |
| !rm -rf /content/zips/ |
| !mkdir /content/unzips |
| !mkdir /content/zips |
|
|
| def sanitize_directory(directory): |
| for filename in os.listdir(directory): |
| file_path = os.path.join(directory, filename) |
| if os.path.isfile(file_path): |
| if filename == ".DS_Store" or filename.startswith("._"): |
| os.remove(file_path) |
| elif os.path.isdir(file_path): |
| sanitize_directory(file_path) |
|
|
| audio_zip = urlparse(url).path.split('/')[-2] + '.zip' |
| audio_zip_path = '/content/zips/' + audio_zip |
|
|
| if url != '': |
| if "drive.google.com" in url: |
| !gdown $url --fuzzy -O "$audio_zip_path" |
| elif "mega.nz" in url: |
| m = Mega() |
| m.download_url(url, '/content/zips') |
| else: |
| !wget "$url" -O "$audio_zip_path" |
|
|
| for filename in os.listdir("/content/zips"): |
| if filename.endswith(".zip"): |
| zip_file = os.path.join("/content/zips", filename) |
| shutil.unpack_archive(zip_file, "/content/unzips", 'zip') |
|
|
| sanitize_directory("/content/unzips") |
|
|
| !mkdir -p /content/Retrieval-based-Voice-Conversion-WebUI/audios |
| for filename in os.listdir("/content/unzips"): |
| if filename.endswith((".wav", ".mp3", ".m4a", ".flac")): |
| audio_file = os.path.join("/content/unzips", filename) |
| destination_file = os.path.join("/content/Retrieval-based-Voice-Conversion-WebUI/audios", filename) |
| shutil.copy2(audio_file, destination_file) |
| if os.path.exists(destination_file): |
| print(f"Copy successful: {destination_file}") |
| else: |
| print(f"Copy failed: {audio_file}") |
|
|
| !rm -r /content/unzips/ |
| !rm -r /content/zips/ |
|
|
| """#**Consider subscribing to my Patreon!** |
| |
| Benefits include: |
| - Full on tech support for AI covers in general |
| - This includes audio mixing and how to train your own models, with any tier. |
| - Tech support priority is given to the latter tier. |
| |
| https://patreon.com/kalomaze |
| |
| Your support would be greatly appreciated! On top of maintaining this colab, I also write and maintain the Google Docs guides, and plan to create a video tutorial for training voices in the future. |
| |
| ##Credits |
| **Rejekts** - Original colab author. Made easy GUI for RVC<br> |
| **RVC-Project dev team** - Original RVC software developers <br> |
| **Mangio621** - Developer of the RVC fork that added crepe support, helped me get it up and running + taught me how to use TensorBoard<br> |
| **Kalomaze** - Creator of this colab, added autobackup + loader feature, fixed downloader to work with zips that had parentheses + streamlined downloader, added TensorBoard picture, made the doc thats linked, general God amongst men (def not biased 100%) |
| |
| #UVR Isolation Stuff |
| |
| ##UVR Colab Method (MDX-Net) |
| The following allows you to use the following models recommended for isolating acapellas for your covers: |
| - Kim vocal 1 |
| - Kim vocal 2 (higher quality, but may have more background vocals that need to be isolated with the Karaoke model) |
| |
| Or for the best instrumental results you can later do: |
| - Inst HQ 1 |
| |
| Reverb should be removed with Reverb HQ. Other remaining echo effects can be dealt with using the VR Architecture UVR colab linked below using the De-Echo models. (or done with local UVR) |
| """ |
|
|
| initialised = True |
| from time import sleep |
| from google.colab import output |
| from google.colab import drive |
|
|
| import sys |
| import os |
| import shutil |
| import psutil |
| import glob |
|
|
| mount_to_drive = True |
| mount_path = '/content/drive/MyDrive' |
|
|
| ai = 'https://github.com/kae0-0/Colab-for-MDX_B' |
| ai_version = 'https://github.com/kae0-0/Colab-for-MDX_B/raw/main/v' |
| onnx_list = 'https://raw.githubusercontent.com/kae0-0/Colab-for-MDX_B/main/onnx_list' |
| |
| |
| ForceUpdate = False |
| class h: |
| def __enter__(self): |
| self._original_stdout = sys.stdout |
| sys.stdout = open(os.devnull, 'w') |
| def __exit__(self, exc_type, exc_val, exc_tb): |
| sys.stdout.close() |
| sys.stdout = self._original_stdout |
| def get_size(bytes, suffix='B'): |
| global svmem |
| factor = 1024 |
| for unit in ["", "K", "M", "G", "T", "P"]: |
| if bytes < factor: |
| return f'{bytes:.2f}{unit}{suffix}' |
| bytes /= factor |
| svmem = psutil.virtual_memory() |
| def console(t): |
| get_ipython().system(t) |
| def LinUzip(file): |
| console(f'unzip -o {file}') |
| |
| def getONNX(): |
| console(f'wget {onnx_list} -O onnx_list') |
| _onnx = open("onnx_list", "r") |
| _onnx = _onnx.readlines() |
| os.remove('onnx_list') |
| for model in _onnx: |
| _model = sanitize_filename(os.path.basename(model)) |
| console(f'wget {model}') |
| LinUzip(_model) |
| os.remove(_model) |
|
|
| def getDemucs(_path): |
| |
| root = "https://dl.fbaipublicfiles.com/demucs/v3.0/" |
| model = { |
| 'demucs_extra': '3646af93' |
| } |
| for models in zip(model.keys(),model.values()): |
| console(f'wget {root+models[0]+"-"+models[1]}.th -O {models[0]}.th') |
| for _ in glob.glob('*.th'): |
| if os.path.isfile(os.path.join(os.getcwd(),_path,_)): |
| os.remove(os.path.join(os.getcwd(),_path,_)) |
| shutil.move(_,_path) |
|
|
| def mount(gdrive=False): |
| if gdrive: |
| if not os.path.exists("/content/drive/MyDrive"): |
| try: |
| drive.mount("/content/drive", force_remount=True) |
| except: |
| drive._mount("/content/drive", force_remount=True) |
| else: |
| pass |
|
|
| mount(mount_to_drive) |
|
|
| def toPath(path='local'): |
| if path == 'local': |
| os.chdir('/content') |
| elif path == 'gdrive': |
| os.chdir(mount_path) |
|
|
| def update(): |
| with h(): |
| console(f'wget {ai_version} -O nver') |
| f = open('nver', 'r') |
| nver = f.read() |
| f = open('v', 'r') |
| cver = f.read() |
| if nver != cver or ForceUpdate: |
| print('New update found! {}'.format(nver)) |
| os.chdir('../') |
| print('Updating ai...',end=' ') |
| with h(): |
| console(f'git clone {ai} temp_MDX_Colab') |
| console('cp -a temp_MDX_Colab/* MDX_Colab/') |
| console('rm -rf temp_MDX_Colab') |
| print('done') |
| os.chdir('MDX_Colab') |
| print('Refreshing models...', end=' ') |
| with h(): |
| |
| getONNX() |
| print('done') |
| output.clear() |
| os.remove('v') |
| os.rename("nver",'v') |
| |
| else: |
| os.remove('nver') |
| print('Using latest version.') |
|
|
| def past_installation(): |
| return os.path.exists('MDX_Colab') |
|
|
| def LoadMDX(): |
| console(f'git clone {ai} MDX_Colab') |
|
|
| |
| |
| print('Installing dependencies will take 45 seconds...',end=' ') |
|
|
| gpu_info = !nvidia-smi |
| gpu_info = '\n'.join(gpu_info) |
| if gpu_info.find('failed') >= 0: |
| svmem = psutil.virtual_memory() |
| gpu_runtime = False |
| with h(): |
| console('pip3 install onnxruntime==1.14.1') |
| else: |
| gpu_runtime = True |
| with h(): |
| console('pip3 install onnxruntime-gpu==1.14.1') |
| with h(): |
| deps = [ |
| 'pathvalidate', |
| 'youtube-dl', |
| 'django' |
| ] |
| for dep in deps: |
| console('pip3 install {}'.format(dep)) |
| |
| |
| console('pip3 install soundfile==0.12.1') |
| console('pip3 install librosa==0.9.1') |
| from pathvalidate import sanitize_filename |
| print('done') |
| if not gpu_runtime: |
| print(f'GPU runtime is disabled. You have {get_size(svmem.total)} RAM.\nProcessing will be incredibly slow. 😈') |
| elif gpu_info.find('Tesla T4') >= 0: |
| print('You got a Tesla T4 GPU. (speeds are around 10-25 it/s)') |
| elif gpu_info.find('Tesla P4') >= 0: |
| print('You got a Tesla P4 GPU. (speeds are around 8-22 it/s)') |
| elif gpu_info.find('Tesla K80') >= 0: |
| print('You got a Tesla K80 GPU. (This is the common gpu, speeds are around 2-10 it/s)') |
| elif gpu_info.find('Tesla P100') >= 0: |
| print('You got a Tesla P100 GPU. (This is the Second to the fastest gpu, speeds are around 15-42 it/s)') |
| else: |
| if gpu_runtime: |
| print('You got an unknown GPU. Please report the GPU you got!') |
| !nvidia-smi |
|
|
| |
| |
| |
| mount(mount_to_drive) |
| toPath('gdrive' if mount_to_drive else 'local') |
| |
| if not past_installation(): |
| print('First time installation will take around 3-6 minutes.\nThis requires around 2-3 GB Free Gdrive space.\nPlease try not to interup installation process!!') |
| print('Downloading AI...',end=' ') |
| with h(): |
| LoadMDX() |
| os.chdir('MDX_Colab') |
| print('done') |
|
|
| print('Downloading models...',end=' ') |
| with h(): |
| |
| getONNX() |
| if os.path.isfile('onnx_list'): |
| os.remove('onnx_list') |
| print('done') |
|
|
| else: |
| os.chdir('MDX_Colab') |
| update() |
|
|
| |
| |
| print('Success!') |
|
|
| |
| |
| |
| url = 'INSERTURLHERE' |
|
|
| import subprocess |
| import os |
| import shutil |
| from urllib.parse import urlparse, parse_qs |
| from google.colab import output |
| from google.colab import drive |
|
|
|
|
| mount_to_drive = True |
| mount_path = '/content/drive/MyDrive' |
|
|
| def mount(gdrive=False): |
| if gdrive: |
| if not os.path.exists("/content/drive/MyDrive"): |
| try: |
| drive.mount("/content/drive", force_remount=True) |
| except: |
| drive._mount("/content/drive", force_remount=True) |
| else: |
| pass |
|
|
| mount(mount_to_drive) |
|
|
| def check_package_installed(package_name): |
| command = f"pip show {package_name}" |
| result = subprocess.run(command.split(), stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) |
| return result.returncode == 0 |
|
|
| def install_package(package_name): |
| command = f"pip install {package_name} --quiet" |
| subprocess.run(command.split(), stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) |
|
|
| if not check_package_installed("mega.py"): |
| install_package("mega.py") |
|
|
| from mega import Mega |
| import os |
| import shutil |
| from urllib.parse import urlparse, parse_qs |
| import urllib.parse |
|
|
| !rm -rf /content/unzips/ |
| !rm -rf /content/zips/ |
| !mkdir /content/unzips |
| !mkdir /content/zips |
|
|
| def sanitize_directory(directory): |
| for filename in os.listdir(directory): |
| file_path = os.path.join(directory, filename) |
| if os.path.isfile(file_path): |
| if filename == ".DS_Store" or filename.startswith("._"): |
| os.remove(file_path) |
| elif os.path.isdir(file_path): |
| sanitize_directory(file_path) |
|
|
| audio_zip = urlparse(url).path.split('/')[-2] + '.zip' |
| audio_zip_path = '/content/zips/' + audio_zip |
|
|
| if url != '': |
| if "drive.google.com" in url: |
| !gdown $url --fuzzy -O "$audio_zip_path" |
| elif "mega.nz" in url: |
| m = Mega() |
| m.download_url(url, '/content/zips') |
| else: |
| !wget "$url" -O "$audio_zip_path" |
|
|
| for filename in os.listdir("/content/zips"): |
| if filename.endswith(".zip"): |
| zip_file = os.path.join("/content/zips", filename) |
| shutil.unpack_archive(zip_file, "/content/unzips", 'zip') |
|
|
| sanitize_directory("/content/unzips") |
|
|
| |
| !mkdir -p /content/drive/MyDrive/MDX_Colab/tracks |
| for filename in os.listdir("/content/unzips"): |
| if filename.endswith((".wav", ".mp3")): |
| audio_file = os.path.join("/content/unzips", filename) |
| destination_file = os.path.join("/content/drive/MyDrive/MDX_Colab/tracks", filename) |
| shutil.copy2(audio_file, destination_file) |
| if os.path.exists(destination_file): |
| print(f"Copy successful: {destination_file}") |
| else: |
| print(f"Copy failed: {audio_file}") |
|
|
| !rm -r /content/unzips/ |
| !rm -r /content/zips/ |
|
|
| """##Audio Isolation""" |
|
|
| |
| |
| |
|
|
| from google.colab import files |
| from IPython.display import display, Javascript |
| import os |
| import shutil |
| import zipfile |
| import ipywidgets as widgets |
|
|
| |
| target_dir = '/content/drive/MyDrive/MDX_Colab/tracks' |
| if not os.path.exists(target_dir): |
| os.makedirs(target_dir) |
|
|
| uploaded = files.upload() |
|
|
| for fn in uploaded.keys(): |
| |
| if fn.endswith('.zip'): |
| |
| zip_path = os.path.join(target_dir, fn) |
| with open(zip_path, 'wb') as f: |
| f.write(uploaded[fn]) |
|
|
| unzip_dir = os.path.join(target_dir, fn[:-4]) |
|
|
| |
| with zipfile.ZipFile(zip_path, 'r') as zip_ref: |
| zip_ref.extractall(unzip_dir) |
|
|
| |
| if os.path.exists(zip_path): |
| os.remove(zip_path) |
|
|
| print('Zip file "{name}" extracted and removed. Files are in: {folder}'.format(name=fn, folder=unzip_dir)) |
|
|
| |
| for extracted_file in os.listdir(unzip_dir): |
| extracted_file_path = os.path.join(unzip_dir, extracted_file) |
| extracted_file_length = os.path.getsize(extracted_file_path) |
|
|
| extracted_file_label = widgets.HTML( |
| value='Extracted file "{name}" with length {length} bytes'.format(name=extracted_file, length=extracted_file_length) |
| ) |
| display(extracted_file_label) |
|
|
| extracted_file_path_text = widgets.HTML( |
| value='File saved to: <a href="{}" target="_blank">{}</a>'.format(extracted_file_path, extracted_file_path) |
| ) |
|
|
| extracted_copy_button = widgets.Button(description='Copy') |
| extracted_copy_button_file_path = extracted_file_path |
|
|
| def copy_to_clipboard(b): |
| js_code = ''' |
| const el = document.createElement('textarea'); |
| el.value = "{path}"; |
| el.setAttribute('readonly', ''); |
| el.style.position = 'absolute'; |
| el.style.left = '-9999px'; |
| document.body.appendChild(el); |
| el.select(); |
| document.execCommand('copy'); |
| document.body.removeChild(el); |
| ''' |
| display(Javascript(js_code.format(path=extracted_copy_button_file_path))) |
|
|
| extracted_copy_button.on_click(copy_to_clipboard) |
| display(widgets.HBox([extracted_file_path_text, extracted_copy_button])) |
|
|
| continue |
|
|
| |
| |
| file_path = os.path.join(target_dir, fn) |
| with open(file_path, 'wb') as f: |
| f.write(uploaded[fn]) |
|
|
| file_length = len(uploaded[fn]) |
| file_label = widgets.HTML( |
| value='User uploaded file "{name}" with length {length} bytes'.format(name=fn, length=file_length) |
| ) |
| display(file_label) |
|
|
| |
| if fn.endswith('.pth') or fn.endswith('.index'): |
| warning_text = widgets.HTML( |
| value='<b style="color: red;">Warning:</b> You are uploading a model file in the wrong place. Please ensure it is uploaded to the correct location.' |
| ) |
| display(warning_text) |
|
|
| |
| file_path_text = widgets.HTML( |
| value='File saved to: <a href="{}" target="_blank">{}</a>'.format(file_path, file_path) |
| ) |
|
|
| copy_button = widgets.Button(description='Copy') |
| copy_button_file_path = file_path |
|
|
| def copy_to_clipboard(b): |
| js_code = ''' |
| const el = document.createElement('textarea'); |
| el.value = "{path}"; |
| el.setAttribute('readonly', ''); |
| el.style.position = 'absolute'; |
| el.style.left = '-9999px'; |
| document.body.appendChild(el); |
| el.select(); |
| document.execCommand('copy'); |
| document.body.removeChild(el); |
| ''' |
| display(Javascript(js_code.format(path=copy_button_file_path))) |
|
|
| copy_button.on_click(copy_to_clipboard) |
| display(widgets.HBox([file_path_text, copy_button])) |
|
|
| |
| for fn in uploaded.keys(): |
| if os.path.exists(os.path.join("/content/", fn)): |
| os.remove(os.path.join("/content/", fn)) |
|
|
| |
| for i in glob.glob('tracks/*'): |
| print(os.path.basename(i)) |
|
|
| if not 'initialised' in globals(): |
| raise NameError('Please run the first cell first!! #scrollTo=H_cTbwhVq4K6') |
|
|
| |
| import json |
| with open('model_data.json', 'r') as f: |
| model_data = json.load(f) |
|
|
| |
| tracks_path = 'tracks/' |
| separated_path = 'separated/' |
|
|
| |
| |
| track = "Butterfly.wav" |
|
|
| |
| |
| ONNX = "MDX-UVR Ins Model Full Band 498 (HQ_2)" |
| Demucs = 'off' |
|
|
| |
| |
| denoise = False |
| normalise = True |
| |
| amplitude_compensation = model_data[ONNX]["compensate"] |
| dim_f = model_data[ONNX]["mdx_dim_f_set"] |
| dim_t = model_data[ONNX]["mdx_dim_t_set"] |
| n_fft = model_data[ONNX]["mdx_n_fft_scale_set"] |
|
|
| mixing_algorithm = 'max_mag' |
| chunks = 55 |
| shifts = 10 |
|
|
| |
| track = track if 'http' in track else tracks_path+track |
| normalise = '--normalise' if normalise else '' |
| denoise = '--denoise' if denoise else '' |
|
|
| if ONNX == 'off': |
| pass |
| else: |
| ONNX = 'onnx/'+ONNX |
| if Demucs == 'off': |
| pass |
| else: |
| Demucs = 'model/'+Demucs+'.th' |
| |
| |
| bass = False |
| drums = False |
| others = False |
| vocals = True |
| |
| |
| invert_bass = False |
| invert_drums = False |
| invert_others = False |
| invert_vocals = True |
| invert_stems = [] |
| stems = [] |
| if bass: |
| stems.append('b') |
| if drums: |
| stems.append('d') |
| if others: |
| stems.append('o') |
| if vocals: |
| stems.append('v') |
|
|
| invert_stems = [] |
| if invert_bass: |
| invert_stems.append('b') |
| if invert_drums: |
| invert_stems.append('d') |
| if invert_others: |
| invert_stems.append('o') |
| if invert_vocals: |
| invert_stems.append('v') |
|
|
| margin = 44100 |
|
|
| |
| |
| |
|
|
| console(f"python main.py --n_fft {n_fft} --dim_f {dim_f} --dim_t {dim_t} --margin {margin} -i \"{track}\" --mixing {mixing_algorithm} --onnx \"{ONNX}\" --model {Demucs} --shifts {round(shifts)} --stems {''.join(stems)} --invert {''.join(invert_stems)} --chunks {chunks} --compensate {amplitude_compensation} {normalise} {denoise}") |
|
|
| """<sup>Models provided are from [Kuielab](https://github.com/kuielab/mdx-net-submission/), [UVR](https://github.com/Anjok07/ultimatevocalremovergui/) and [Kim](https://github.com/KimberleyJensen/) <br> (you can support UVR [here](https://www.buymeacoffee.com/uvr5/vip-model-download-instructions) and [here](https://boosty.to/uvr)).</sup></br> |
| <sup>Original UVR notebook by [Audio Hacker](https://www.youtube.com/channel/UC0NiSV1jLMH-9E09wiDVFYw/), modified by Audio Separation community & then kalomaze (for RVC colab).</sup></br> |
| <sup>Big thanks to the [Audio Separation Discord](https://discord.gg/zeYU2Wzbgj) for helping me implement this in the colab.</sup></br> |
| |
| ##**UVR Colab Settings explanation**<br> |
| |
| The defaults already provided are generally recommended. However, if you would like to try tweaking them, here's an explanation: |
| |
| *Mixing algorithm* - max_mag - is generally for vocals (gives the most residues in instrumentals), min_mag - for instrumentals (the most aggresive) though "min_mag solve some un-wanted vocal soundings, but instrumental [is] more muffled and less detailed". Check out also "default" as it's in between both - a.k.a. average (it's also required for Demucs enabled which works only for vocal models).<br> |
| |
| *Chunks* - Set it to 55 or 40 (less aggressive) to alleviate some occasional instrument dissapearing. |
| Set 1 for the best clarity. It works for at least instrumental model (4:15 track, at least for Tesla T4 (shown at the top) generally better quality, but some instruments tend to disappear more using 1 than 10. For Demucs enabled and/or vocal model it can be set to 10 if your track is below 5:00 minutes. The more chunks, the faster separation up to ~40. For 4:15 track, 72 is max supported till memory allocation error shows up (disabled chunks returns error too). <br> |
| |
| *Shifts* - can be set max to 10, but it only slightly increases SDR, while processing time is 1.7x longer for each shift and it gives similar result to shifts 5. |
| |
| *Normalization* - "normalizes all input at first and then changes the wave peak back to original. This makes the separation process better, also less noise" (e.g. if you have to noisy hihats or big amplitude compensation - disable it). |
| <br> |
| |
| *Demucs* enabled works correctly with mixing algorithm set to default and only with vocal models (Kim and 427). It's also the only option to get rid of noise of MDX models. Normalization enabled is necessary (but that cnfiguration has slightly more vocal residues than instrumental model). Decrease chunks to 40 if you have ONNXRuntimeError with Demucs on (it requires lower chunks). |
| <br> |
| |
| ##**Recommended models**<br> |
| |
| For vocals (by raw SDR output, not factoring in manual cleanup): |
| - Kim vocal 2 (less instrumental residues in vocal stem) |
| - Kim vocal 1 |
| <br>or alternatively |
| - 427 |
| - 406 |
| |
| For best lead vocals: |
| - Karaokee 2 |
| |
| For best backing vocals: |
| - [HP_KAROKEE-MSB2-3BAND-3090](https://colab.research.google.com/drive/16Q44VBJiIrXOgTINztVDVeb0XKhLKHwl?usp=sharing) |
| |
| It's rather inconvenient that the VR Architecture models aren't here and have to be run through the above colab, but they can't coexist in the same colab as of right now. I will attempting a better solution in the future. |
| """ |