MDX-Net (code, colab, models)
Browse files- .gitattributes +1 -0
- KUIELab-MDX-Net. A Two-Stream Neural Network for Music Demixing.pdf +3 -0
- code/mdx-net [KimberleyJensen] +77 -6.zip +3 -0
- code/mdx-net.zip +3 -0
- code/sdx23 [ws-choi] +43.zip +3 -0
- colab/MDX_Net_Colab.ipynb +569 -0
- models/MDXCENTRE/.gitattributes +35 -0
- models/MDXCENTRE/config_mdx23c_similarity.yaml +89 -0
- models/MDXCENTRE/model_mdx23c_ep_237_l1_freq_71.9982.ckpt +3 -0
- models/MDXCENTRE/source.txt +1 -0
- models/UVR5-MDX-NET-VIP-MODELS/.gitattributes +35 -0
- models/UVR5-MDX-NET-VIP-MODELS/MDX23C-8KFFT-InstVoc_HQ_2.ckpt +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/README.md +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET-Inst_full_292.onnx +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Inst_187_beta.onnx +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Inst_82_beta.onnx +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Inst_90_beta.onnx +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Main_340.onnx +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Main_390.onnx +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Main_406.onnx +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Main_427.onnx +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Main_438.onnx +3 -0
- models/UVR5-MDX-NET-VIP-MODELS/source.txt +1 -0
- models/aufr33_jarredou_MDXv3_DeReverb/.gitattributes +35 -0
- models/aufr33_jarredou_MDXv3_DeReverb/config_dereverb_mdx23c.yaml +135 -0
- models/aufr33_jarredou_MDXv3_DeReverb/dereverb_mdx23c_sdr_6.9096.ckpt +3 -0
- models/aufr33_jarredou_MDXv3_DeReverb/source.txt +1 -0
- models/mdxnet/.gitattributes +35 -0
- models/mdxnet/README.md +8 -0
- models/mdxnet/UVR-MDX-NET-Inst_HQ_3.onnx +3 -0
- models/mdxnet/UVR-MDX-NET-Voc_FT.onnx +3 -0
- models/mdxnet/UVR_MDXNET_KARA_2.onnx +3 -0
- models/mdxnet/model_data.json +50 -0
- models/mdxnet/source.txt +1 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
KUIELab-MDX-Net.[[:space:]]A[[:space:]]Two-Stream[[:space:]]Neural[[:space:]]Network[[:space:]]for[[:space:]]Music[[:space:]]Demixing.pdf filter=lfs diff=lfs merge=lfs -text
|
KUIELab-MDX-Net. A Two-Stream Neural Network for Music Demixing.pdf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91429fab5485c961d53f97a12570ac1d6b5879e1db4b025207d1801d5a22c65d
|
| 3 |
+
size 955875
|
code/mdx-net [KimberleyJensen] +77 -6.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cddf827a1afca3a1a93efa47ecfa2a14c077b63c0a6a589bdae7790cba1deda
|
| 3 |
+
size 13900269
|
code/mdx-net.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95789b4287f39011b05c7b73fdcc537af667a067c996c0b6407e2fb7f58cd6ae
|
| 3 |
+
size 13902046
|
code/sdx23 [ws-choi] +43.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e6be2629dcca93e3fc4913111b7a8834c3c3e39caa200f05297170ba27f6dd1
|
| 3 |
+
size 14059340
|
colab/MDX_Net_Colab.ipynb
ADDED
|
@@ -0,0 +1,569 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cells": [
|
| 3 |
+
{
|
| 4 |
+
"cell_type": "markdown",
|
| 5 |
+
"metadata": {
|
| 6 |
+
"id": "wX9xzLur4tus"
|
| 7 |
+
},
|
| 8 |
+
"source": [
|
| 9 |
+
"# MDX-Net Colab\n",
|
| 10 |
+
"<div style=\"display:flex; align-items:center; font-size: 16px;\">\n",
|
| 11 |
+
" <img src=\"https://github.githubassets.com/pinned-octocat.svg\" alt=\"icon1\" style=\"margin-right:10px; height: 20px;\" width=\"1.5%\">\n",
|
| 12 |
+
" <span>Trained models provided in this notebook are from <a href=\"https://github.com/Anjok07\">UVR-GUI</a>.</span>\n",
|
| 13 |
+
"</div>\n",
|
| 14 |
+
"<div style=\"display:flex; align-items:center; font-size: 16px;\">\n",
|
| 15 |
+
" <img src=\"https://github.com/Anjok07/ultimatevocalremovergui/raw/master/gui_data/img/GUI-Icon.ico\" alt=\"icon2\" style=\"margin-right:10px; height: 20px;margin-top:10px\" width=\"1.5%\">\n",
|
| 16 |
+
" <span>OFFICIAL UVR GITHUB PAGE: <a href=\"https://github.com/Anjok07/ultimatevocalremovergui\">here</a>.</span>\n",
|
| 17 |
+
"</div>\n",
|
| 18 |
+
"<div style=\"display:flex; align-items:center; font-size: 16px;\">\n",
|
| 19 |
+
" <img src=\"https://avatars.githubusercontent.com/u/24620594\" alt=\"icon3\" style=\"margin-right:10px; height: 20px;\" width=\"1.5%\">\n",
|
| 20 |
+
" <span>OFFICIAL CLI Version: <a href=\"https://github.com/tsurumeso/vocal-remover\">here</a>.</span>\n",
|
| 21 |
+
"</div>\n",
|
| 22 |
+
"<div style=\"display:flex; align-items:center; font-size: 16px;\">\n",
|
| 23 |
+
" <img src=\"https://icons.getbootstrap.com/assets/icons/discord.svg\" alt=\"icon4\" style=\"margin-right:10px; height: 20px;\" width=\"1.5%\">\n",
|
| 24 |
+
" <span>Join our <a href=\"https://cutt.ly/0TcDjmo\">Discord server</a>!</span>\n",
|
| 25 |
+
"</div>\n",
|
| 26 |
+
"<sup><br>Ultimate Vocal Remover (unofficial)</sup>\n",
|
| 27 |
+
"<sup><br>MDX-Net by <a href=\"https://github.com/kuielab\">kuielab</a> and adapted for Colaboratory by <a href=\"https://www.youtube.com/channel/UC0NiSV1jLMH-9E09wiDVFYw\">AudioHacker</a>.</sup>\n",
|
| 28 |
+
"\n",
|
| 29 |
+
"<sup><br>Your support means a lot to me. If you enjoy my work, please consider buying me a ko-fi:<br></sup>\n",
|
| 30 |
+
"[Buy me a ko-fi](https://ko-fi.com/X8X6M8FR0)<br>\n"
|
| 31 |
+
]
|
| 32 |
+
},
|
| 33 |
+
{
|
| 34 |
+
"cell_type": "markdown",
|
| 35 |
+
"source": [
|
| 36 |
+
"Common issues\n",
|
| 37 |
+
"\n",
|
| 38 |
+
"- For \"OSError: [Errno 107] Transport endpoint is not connected\", go to Environment and launch session again, then rerun that cell.<br>\n",
|
| 39 |
+
"- For \"credential propagation unsuccessful\" error, go to Environment, kill the environment, wait 30-40s (or potentially click refresh button in the file manager) and start over. <br>\n",
|
| 40 |
+
"- If you exceed the Colab GPU limit for free users, switch to another Google account in the right corner, and use that same account for GDrive. <br>\n",
|
| 41 |
+
"- Grant all the privileges for GDrive, or you'll see a mounting error.<br>\n",
|
| 42 |
+
"\n",
|
| 43 |
+
"\n"
|
| 44 |
+
],
|
| 45 |
+
"metadata": {
|
| 46 |
+
"id": "aywwSSWivQy_"
|
| 47 |
+
}
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"cell_type": "code",
|
| 51 |
+
"execution_count": null,
|
| 52 |
+
"metadata": {
|
| 53 |
+
"cellView": "form",
|
| 54 |
+
"id": "3J69RV7G8ocb"
|
| 55 |
+
},
|
| 56 |
+
"outputs": [],
|
| 57 |
+
"source": [
|
| 58 |
+
"#@markdown ### Initialization\n",
|
| 59 |
+
"import importlib.metadata\n",
|
| 60 |
+
"\n",
|
| 61 |
+
"desired_version = \"1.26.0\"\n",
|
| 62 |
+
"\n",
|
| 63 |
+
"try:\n",
|
| 64 |
+
" installed_version = importlib.metadata.version(\"numpy\")\n",
|
| 65 |
+
" if installed_version == desired_version:\n",
|
| 66 |
+
" print(f\"NumPy {desired_version} is already installed.\")\n",
|
| 67 |
+
" else:\n",
|
| 68 |
+
" print(f\"Installing NumPy {desired_version} (current: {installed_version})...\")\n",
|
| 69 |
+
" !pip install numpy=={desired_version} --prefer-binary\n",
|
| 70 |
+
" import os\n",
|
| 71 |
+
" os._exit(00) # Restart runtime for changes to take effect\n",
|
| 72 |
+
"except importlib.metadata.PackageNotFoundError:\n",
|
| 73 |
+
" print(f\"NumPy is not installed. Installing {desired_version}...\")\n",
|
| 74 |
+
" !pip install numpy=={desired_version} --prefer-binary\n",
|
| 75 |
+
" import os\n",
|
| 76 |
+
" os._exit(00)\n",
|
| 77 |
+
"\n",
|
| 78 |
+
"%cd /content\n",
|
| 79 |
+
"import json\n",
|
| 80 |
+
"import os\n",
|
| 81 |
+
"import os.path\n",
|
| 82 |
+
"import gc\n",
|
| 83 |
+
"import psutil\n",
|
| 84 |
+
"import requests\n",
|
| 85 |
+
"import subprocess\n",
|
| 86 |
+
"import glob\n",
|
| 87 |
+
"import time\n",
|
| 88 |
+
"import logging\n",
|
| 89 |
+
"import sys\n",
|
| 90 |
+
"from bs4 import BeautifulSoup\n",
|
| 91 |
+
"from google.colab import drive, files, output\n",
|
| 92 |
+
"from IPython.display import Audio, display\n",
|
| 93 |
+
"\n",
|
| 94 |
+
"if \"first_cell_ran\" in locals():\n",
|
| 95 |
+
" print(\"You've ran this cell for this session. No need to run it again.\\nif you think something went wrong or you want to change mounting path, restart the runtime.\")\n",
|
| 96 |
+
"else:\n",
|
| 97 |
+
" print('Setting up... Please wait around 1-2 minute(s).')\n",
|
| 98 |
+
"\n",
|
| 99 |
+
" branch = \"https://github.com/NaJeongMo/Colab-for-MDX_B\"\n",
|
| 100 |
+
"\n",
|
| 101 |
+
" model_params = \"https://raw.githubusercontent.com/TRvlvr/application_data/main/mdx_model_data/model_data_new.json\"\n",
|
| 102 |
+
" _Models = \"https://github.com/TRvlvr/model_repo/releases/download/all_public_uvr_models/\"\n",
|
| 103 |
+
" # _models = \"https://pastebin.com/raw/jBzYB8vz\"\n",
|
| 104 |
+
" _models = \"https://raw.githubusercontent.com/TRvlvr/application_data/main/filelists/download_checks.json\"\n",
|
| 105 |
+
" stem_naming = \"https://pastebin.com/raw/mpH4hRcF\"\n",
|
| 106 |
+
" arl_check_endpoint = 'https://dz.doubledouble.top/check' # param: arl?=<>\n",
|
| 107 |
+
"\n",
|
| 108 |
+
" file_folder = \"Colab-for-MDX_B\"\n",
|
| 109 |
+
"\n",
|
| 110 |
+
" model_ids = requests.get(_models).json()\n",
|
| 111 |
+
" model_ids = model_ids[\"mdx_download_list\"].values()\n",
|
| 112 |
+
"\n",
|
| 113 |
+
" model_params = requests.get(model_params).json()\n",
|
| 114 |
+
" stem_naming = requests.get(stem_naming).json()\n",
|
| 115 |
+
"\n",
|
| 116 |
+
" os.makedirs(\"tmp_models\", exist_ok=True)\n",
|
| 117 |
+
" # @markdown Start the cell below, and once NumPy has been installed (i.e. when you see the session crash info), run that cell again - do that on every first Colab launch from now on to finish the Colab initialization, then continue below. <br> <br>If you don't wish to mount Google Drive, uncheck this box.\n",
|
| 118 |
+
" MountDrive = True # @param{type:\"boolean\"}\n",
|
| 119 |
+
" # @markdown The path for the drive to be mounted: Please be cautious when modifying this as it can cause issues if not done properly.\n",
|
| 120 |
+
" mounting_path = \"/content/drive/MyDrive\" # @param [\"snippets:\",\"/content/drive/MyDrive\",\"/content/drive/Shareddrives/<your shared drive name>\", \"/content/drive/Shareddrives/Shared Drive\"]{allow-input: true}\n",
|
| 121 |
+
" # @markdown Force update and disregard local changes: discards all local modifications in your repository, effectively replacing all files with the versions from the original commit.\n",
|
| 122 |
+
" force_update = False # @param{type:\"boolean\"}\n",
|
| 123 |
+
" # @markdown Auto Update (does not discard your changes)\n",
|
| 124 |
+
" auto_update = True # @param{type:\"boolean\"}\n",
|
| 125 |
+
"\n",
|
| 126 |
+
" #testing\n",
|
| 127 |
+
" #!python -m pip install numpy==1.26\n",
|
| 128 |
+
" #!pip install numpy==1.25.2\n",
|
| 129 |
+
" #!pip install torch==1.13.1\n",
|
| 130 |
+
" #!python -m pip install scipy==1.13.1\n",
|
| 131 |
+
"\n",
|
| 132 |
+
" #onnxruntime-gpu fix\n",
|
| 133 |
+
" !python -m pip install ort-nightly-gpu --index-url=https://aiinfra.pkgs.visualstudio.com/PublicPackages/_packaging/ort-cuda-12-nightly/pypi/simple/\n",
|
| 134 |
+
" !pip install onnxruntime-gpu==1.21.0\n",
|
| 135 |
+
"\n",
|
| 136 |
+
" reqs_apt = [] # !sudo apt-get install\n",
|
| 137 |
+
" reqs_pip = [\"librosa\", \"deemix\", \"yt_dlp\"] # pip3 install\n",
|
| 138 |
+
"\n",
|
| 139 |
+
" class hide_opt: # hide outputs\n",
|
| 140 |
+
" def __enter__(self):\n",
|
| 141 |
+
" self._original_stdout = sys.stdout\n",
|
| 142 |
+
" sys.stdout = open(os.devnull, \"w\")\n",
|
| 143 |
+
"\n",
|
| 144 |
+
" def __exit__(self, exc_type, exc_val, exc_tb):\n",
|
| 145 |
+
" sys.stdout.close()\n",
|
| 146 |
+
" sys.stdout = self._original_stdout\n",
|
| 147 |
+
"\n",
|
| 148 |
+
" def get_size(bytes, suffix=\"B\"): # read ram\n",
|
| 149 |
+
" global svmem\n",
|
| 150 |
+
" factor = 1024\n",
|
| 151 |
+
" for unit in [\"\", \"K\", \"M\", \"G\", \"T\", \"P\"]:\n",
|
| 152 |
+
" if bytes < factor:\n",
|
| 153 |
+
" return f\"{bytes:.2f}{unit}{suffix}\"\n",
|
| 154 |
+
" bytes /= factor\n",
|
| 155 |
+
" svmem = psutil.virtual_memory()\n",
|
| 156 |
+
"\n",
|
| 157 |
+
"\n",
|
| 158 |
+
" print('installing requirements...',end=' ')\n",
|
| 159 |
+
" with hide_opt():\n",
|
| 160 |
+
" for x in reqs_apt:\n",
|
| 161 |
+
" subprocess.run([\"sudo\", \"apt-get\", \"install\", x])\n",
|
| 162 |
+
" for x in reqs_pip:\n",
|
| 163 |
+
" subprocess.run([\"python3\", \"-m\", \"pip\", \"install\", x])\n",
|
| 164 |
+
" print('done')\n",
|
| 165 |
+
"\n",
|
| 166 |
+
" def install_or_mount_drive():\n",
|
| 167 |
+
" print(\n",
|
| 168 |
+
" \"Please log in to your account by following the prompts in the pop-up tab.\\nThis step is necessary to install the files to your Google Drive.\\nIf you have any concerns about the safety of this notebook, you can choose not to mount your drive by unchecking the \\\"MountDrive\\\" checkbox.\"\n",
|
| 169 |
+
" )\n",
|
| 170 |
+
" drive.mount(\"/content/drive\", force_remount=True)\n",
|
| 171 |
+
" os.chdir(mounting_path)\n",
|
| 172 |
+
" # check if previous installation is done\n",
|
| 173 |
+
" if os.path.exists(os.path.join(mounting_path, file_folder)):\n",
|
| 174 |
+
" # update checking\n",
|
| 175 |
+
" os.chdir(file_folder)\n",
|
| 176 |
+
"\n",
|
| 177 |
+
" if force_update:\n",
|
| 178 |
+
" print('Force updating...')\n",
|
| 179 |
+
"\n",
|
| 180 |
+
" commands = [\n",
|
| 181 |
+
" [\"git\", \"pull\"],\n",
|
| 182 |
+
" [\"git\", \"checkout\", \"--\", \".\"],\n",
|
| 183 |
+
" ]\n",
|
| 184 |
+
"\n",
|
| 185 |
+
" for cmd in commands:\n",
|
| 186 |
+
" subprocess.run(cmd)\n",
|
| 187 |
+
"\n",
|
| 188 |
+
" elif auto_update:\n",
|
| 189 |
+
" print('Checking for updates...')\n",
|
| 190 |
+
" commands = [\n",
|
| 191 |
+
" [\"git\", \"pull\"],\n",
|
| 192 |
+
" ]\n",
|
| 193 |
+
"\n",
|
| 194 |
+
" for cmd in commands:\n",
|
| 195 |
+
" subprocess.run(cmd)\n",
|
| 196 |
+
" else:\n",
|
| 197 |
+
" subprocess.run([\"git\", \"clone\", \"https://github.com/NaJeongMo/Colab-for-MDX_B.git\"])\n",
|
| 198 |
+
" os.chdir(file_folder)\n",
|
| 199 |
+
"\n",
|
| 200 |
+
" def use_uvr_without_saving():\n",
|
| 201 |
+
" global mounting_path\n",
|
| 202 |
+
" print(\"Notice: files won't be saved to personal drive.\")\n",
|
| 203 |
+
" print(f\"Downloading {file_folder}...\", end=\" \")\n",
|
| 204 |
+
" mounting_path = \"/content\"\n",
|
| 205 |
+
" with hide_opt():\n",
|
| 206 |
+
" os.chdir(mounting_path)\n",
|
| 207 |
+
" subprocess.run([\"git\", \"clone\", \"https://github.com/NaJeongMo/Colab-for-MDX_B.git\"])\n",
|
| 208 |
+
" os.chdir(file_folder)\n",
|
| 209 |
+
"\n",
|
| 210 |
+
" if MountDrive:\n",
|
| 211 |
+
" install_or_mount_drive()\n",
|
| 212 |
+
" else:\n",
|
| 213 |
+
" use_uvr_without_saving()\n",
|
| 214 |
+
" print(\"done!\")\n",
|
| 215 |
+
" if not os.path.exists(\"tracks\"):\n",
|
| 216 |
+
" os.mkdir(\"tracks\")\n",
|
| 217 |
+
"\n",
|
| 218 |
+
" print('Importing required libraries...',end=' ')\n",
|
| 219 |
+
"\n",
|
| 220 |
+
" import os\n",
|
| 221 |
+
" import mdx\n",
|
| 222 |
+
" import librosa\n",
|
| 223 |
+
" import torch\n",
|
| 224 |
+
" import soundfile as sf\n",
|
| 225 |
+
" import numpy as np\n",
|
| 226 |
+
" import yt_dlp\n",
|
| 227 |
+
"\n",
|
| 228 |
+
" from deezer import Deezer\n",
|
| 229 |
+
" from deezer import TrackFormats\n",
|
| 230 |
+
" import deemix\n",
|
| 231 |
+
" from deemix.settings import load as loadSettings\n",
|
| 232 |
+
" from deemix.downloader import Downloader\n",
|
| 233 |
+
" from deemix import generateDownloadObject\n",
|
| 234 |
+
"\n",
|
| 235 |
+
" logger = logging.getLogger(\"yt_dlp\")\n",
|
| 236 |
+
" logger.setLevel(logging.ERROR)\n",
|
| 237 |
+
"\n",
|
| 238 |
+
" def id_to_ptm(mkey):\n",
|
| 239 |
+
" if mkey in model_ids:\n",
|
| 240 |
+
" mpath = f\"/content/tmp_models/{mkey}\"\n",
|
| 241 |
+
" if not os.path.exists(f'/content/tmp_models/{mkey}'):\n",
|
| 242 |
+
" print('Downloading model...',end=' ')\n",
|
| 243 |
+
" subprocess.run(\n",
|
| 244 |
+
" [\"wget\", _Models+mkey, \"-O\", mpath]\n",
|
| 245 |
+
" )\n",
|
| 246 |
+
" print(f'saved to {mpath}')\n",
|
| 247 |
+
" # get_ipython().system(f'gdown {model_id} -O /content/tmp_models/{mkey}')\n",
|
| 248 |
+
" return mpath\n",
|
| 249 |
+
" else:\n",
|
| 250 |
+
" return mpath\n",
|
| 251 |
+
" else:\n",
|
| 252 |
+
" mpath = f'models/{mkey}'\n",
|
| 253 |
+
" return mpath\n",
|
| 254 |
+
"\n",
|
| 255 |
+
" def prepare_mdx(custom_param=False, dim_f=None, dim_t=None, n_fft=None, stem_name=None, compensation=None):\n",
|
| 256 |
+
" device = torch.device('cuda:0') if torch.cuda.is_available() else torch.device('cpu')\n",
|
| 257 |
+
" if custom_param:\n",
|
| 258 |
+
" assert not (dim_f is None or dim_t is None or n_fft is None or compensation is None), 'Custom parameter selected, but incomplete parameters are provided.'\n",
|
| 259 |
+
" mdx_model = mdx.MDX_Model(\n",
|
| 260 |
+
" device,\n",
|
| 261 |
+
" dim_f = dim_f,\n",
|
| 262 |
+
" dim_t = dim_t,\n",
|
| 263 |
+
" n_fft = n_fft,\n",
|
| 264 |
+
" stem_name=stem_name,\n",
|
| 265 |
+
" compensation=compensation\n",
|
| 266 |
+
" )\n",
|
| 267 |
+
" else:\n",
|
| 268 |
+
" model_hash = mdx.MDX.get_hash(onnx)\n",
|
| 269 |
+
" if model_hash in model_params:\n",
|
| 270 |
+
" mp = model_params.get(model_hash)\n",
|
| 271 |
+
" mdx_model = mdx.MDX_Model(\n",
|
| 272 |
+
" device,\n",
|
| 273 |
+
" dim_f = mp[\"mdx_dim_f_set\"],\n",
|
| 274 |
+
" dim_t = 2**mp[\"mdx_dim_t_set\"],\n",
|
| 275 |
+
" n_fft = mp[\"mdx_n_fft_scale_set\"],\n",
|
| 276 |
+
" stem_name=mp[\"primary_stem\"],\n",
|
| 277 |
+
" compensation=compensation if not custom_param and compensation is not None else mp[\"compensate\"]\n",
|
| 278 |
+
" )\n",
|
| 279 |
+
" return mdx_model\n",
|
| 280 |
+
"\n",
|
| 281 |
+
" def run_mdx(onnx, mdx_model,filename,diff=False,suffix=None,diff_suffix=None, denoise=False, m_threads=1):\n",
|
| 282 |
+
" mdx_sess = mdx.MDX(onnx,mdx_model)\n",
|
| 283 |
+
" print(f\"Processing: {filename}\")\n",
|
| 284 |
+
" wave, sr = librosa.load(filename,mono=False, sr=44100)\n",
|
| 285 |
+
" # normalizing input wave gives better output\n",
|
| 286 |
+
" peak = max(np.max(wave), abs(np.min(wave)))\n",
|
| 287 |
+
" wave /= peak\n",
|
| 288 |
+
" if denoise:\n",
|
| 289 |
+
" wave_processed = -(mdx_sess.process_wave(-wave, m_threads)) + (mdx_sess.process_wave(wave, m_threads))\n",
|
| 290 |
+
" wave_processed *= 0.5\n",
|
| 291 |
+
" else:\n",
|
| 292 |
+
" wave_processed = mdx_sess.process_wave(wave, m_threads)\n",
|
| 293 |
+
" # return to previous peak\n",
|
| 294 |
+
" wave_processed *= peak\n",
|
| 295 |
+
"\n",
|
| 296 |
+
" stem_name = mdx_model.stem_name if suffix is None else suffix # use suffix if provided\n",
|
| 297 |
+
" save_path = f\"{os.path.basename(os.path.splitext(filename)[0])}_{stem_name}.wav\"\n",
|
| 298 |
+
" save_path = os.path.join(\n",
|
| 299 |
+
" 'separated',\n",
|
| 300 |
+
" save_path\n",
|
| 301 |
+
" )\n",
|
| 302 |
+
" sf.write(\n",
|
| 303 |
+
" save_path,\n",
|
| 304 |
+
" wave_processed.T,\n",
|
| 305 |
+
" sr\n",
|
| 306 |
+
" )\n",
|
| 307 |
+
"\n",
|
| 308 |
+
" print(f'done, saved to: {save_path}')\n",
|
| 309 |
+
"\n",
|
| 310 |
+
" if diff:\n",
|
| 311 |
+
" diff_stem_name = stem_naming.get(stem_name) if diff_suffix is None else diff_suffix # use suffix if provided\n",
|
| 312 |
+
" stem_name = f\"{stem_name}_diff\" if diff_stem_name is None else diff_stem_name\n",
|
| 313 |
+
" save_path = f\"{os.path.basename(os.path.splitext(filename)[0])}_{stem_name}.wav\"\n",
|
| 314 |
+
" save_path = os.path.join(\n",
|
| 315 |
+
" 'separated',\n",
|
| 316 |
+
" save_path\n",
|
| 317 |
+
" )\n",
|
| 318 |
+
" sf.write(\n",
|
| 319 |
+
" save_path,\n",
|
| 320 |
+
" (-wave_processed.T*mdx_model.compensation)+wave.T,\n",
|
| 321 |
+
" sr\n",
|
| 322 |
+
" )\n",
|
| 323 |
+
" print(f'invert done, saved to: {save_path}')\n",
|
| 324 |
+
" del mdx_sess, wave_processed, wave\n",
|
| 325 |
+
" gc.collect()\n",
|
| 326 |
+
"\n",
|
| 327 |
+
" def is_valid_url(url):\n",
|
| 328 |
+
" import re\n",
|
| 329 |
+
" regex = re.compile(\n",
|
| 330 |
+
" r'^https?://'\n",
|
| 331 |
+
" r'(?:(?:[A-Z0-9](?:[A-Z0-9-]{0,61}[A-Z0-9])?\\.)+[A-Z]{2,6}\\.?|'\n",
|
| 332 |
+
" r'localhost|'\n",
|
| 333 |
+
" r'\\d{1,3}\\.\\d{1,3}\\.\\d{1,3}\\.\\d{1,3})'\n",
|
| 334 |
+
" r'(?::\\d+)?'\n",
|
| 335 |
+
" r'(?:/?|[/?]\\S+)$', re.IGNORECASE)\n",
|
| 336 |
+
" return url is not None and regex.search(url)\n",
|
| 337 |
+
"\n",
|
| 338 |
+
" def download_deezer(link, arl, fmt='FLAC'):\n",
|
| 339 |
+
" match fmt:\n",
|
| 340 |
+
" case 'FLAC':\n",
|
| 341 |
+
" bitrate = TrackFormats.FLAC\n",
|
| 342 |
+
" case 'MP3_320':\n",
|
| 343 |
+
" bitrate = TrackFormats.MP3_320\n",
|
| 344 |
+
" case 'MP3_128':\n",
|
| 345 |
+
" bitrate = TrackFormats.MP3_128\n",
|
| 346 |
+
" case _:\n",
|
| 347 |
+
" bitrate = TrackFormats.MP3_128\n",
|
| 348 |
+
"\n",
|
| 349 |
+
" dz = Deezer()\n",
|
| 350 |
+
" settings = loadSettings('dz_config')\n",
|
| 351 |
+
" settings['downloadLocation'] = './tracks'\n",
|
| 352 |
+
" if not dz.login_via_arl(arl.strip()):\n",
|
| 353 |
+
" raise Exception('Error while logging in with provided ARL.')\n",
|
| 354 |
+
" downloadObject = generateDownloadObject(dz, link, bitrate)\n",
|
| 355 |
+
" print(f'Downloading {downloadObject.type}: \"{downloadObject.title}\" by {downloadObject.artist}...',end=' ',flush=True)\n",
|
| 356 |
+
" Downloader(dz, downloadObject, settings).start()\n",
|
| 357 |
+
" print(f'done.')\n",
|
| 358 |
+
"\n",
|
| 359 |
+
" path_to_audio = []\n",
|
| 360 |
+
" for file in downloadObject.files:\n",
|
| 361 |
+
" path_to_audio.append(file[\"path\"])\n",
|
| 362 |
+
"\n",
|
| 363 |
+
" return path_to_audio\n",
|
| 364 |
+
"\n",
|
| 365 |
+
" def download_link(url):\n",
|
| 366 |
+
" ydl_opts = {\n",
|
| 367 |
+
" 'format': 'bestvideo+bestaudio/best',\n",
|
| 368 |
+
" 'outtmpl': '%(title)s.%(ext)s',\n",
|
| 369 |
+
" 'nocheckcertificate': True,\n",
|
| 370 |
+
" 'ignoreerrors': True,\n",
|
| 371 |
+
" 'no_warnings': True,\n",
|
| 372 |
+
" 'extractaudio': True,\n",
|
| 373 |
+
" }\n",
|
| 374 |
+
" with yt_dlp.YoutubeDL(ydl_opts) as ydl:\n",
|
| 375 |
+
" result = ydl.extract_info(url, download=True)\n",
|
| 376 |
+
" download_path = ydl.prepare_filename(result)\n",
|
| 377 |
+
" return download_path\n",
|
| 378 |
+
"\n",
|
| 379 |
+
" print('finished setting up!')\n",
|
| 380 |
+
" first_cell_ran = True"
|
| 381 |
+
]
|
| 382 |
+
},
|
| 383 |
+
{
|
| 384 |
+
"cell_type": "code",
|
| 385 |
+
"execution_count": null,
|
| 386 |
+
"metadata": {
|
| 387 |
+
"id": "4hd1TzEGCiRo",
|
| 388 |
+
"cellView": "form"
|
| 389 |
+
},
|
| 390 |
+
"outputs": [],
|
| 391 |
+
"source": [
|
| 392 |
+
"if 'first_cell_ran' in locals():\n",
|
| 393 |
+
" os.chdir(mounting_path + '/' + file_folder + '/')\n",
|
| 394 |
+
" #parameter markdowns-----------------\n",
|
| 395 |
+
" #@markdown ### Input files\n",
|
| 396 |
+
" #@markdown Track filename: Upload your songs to the \"tracks\" folder (by default in MyDrive\\Colab-for-MDX_B\\). <br>You may provide multiple links/files by splitting them with ; <br>Or you can paste a direct file path from the file manager on the left.\n",
|
| 397 |
+
" filename = \"https://deezer.com/album/281108671\" #@param {type:\"string\"}\n",
|
| 398 |
+
" #@markdown onnx model (if you have your own model, upload it in models folder)\n",
|
| 399 |
+
" onnx = \"UVR-MDX-NET-Inst_HQ_5.onnx\" #@param [\"Kim_Inst.onnx\", \"Kim_Vocal_1.onnx\", \"Kim_Vocal_2.onnx\", \"kuielab_a_bass.onnx\", \"kuielab_a_drums.onnx\", \"kuielab_a_other.onnx\", \"kuielab_a_vocals.onnx\", \"kuielab_b_bass.onnx\", \"kuielab_b_drums.onnx\", \"kuielab_b_other.onnx\", \"kuielab_b_vocals.onnx\", \"Reverb_HQ_By_FoxJoy.onnx\", \"UVR-MDX-NET-Inst_1.onnx\", \"UVR-MDX-NET-Inst_2.onnx\", \"UVR-MDX-NET-Inst_3.onnx\", \"UVR-MDX-NET-Inst_HQ_1.onnx\", \"UVR-MDX-NET-Inst_HQ_2.onnx\", \"UVR-MDX-NET-Inst_Main.onnx\", \"UVR_MDXNET_1_9703.onnx\", \"UVR_MDXNET_2_9682.onnx\", \"UVR_MDXNET_3_9662.onnx\", \"UVR_MDXNET_9482.onnx\", \"UVR_MDXNET_KARA.onnx\", \"UVR_MDXNET_KARA_2.onnx\", \"UVR_MDXNET_Main.onnx\", \"UVR-MDX-NET-Inst_HQ_3.onnx\", \"UVR-MDX-NET-Inst_HQ_4.onnx\", \"UVR-MDX-NET-Inst_HQ_5.onnx\", \"UVR-MDX-NET-Voc_FT.onnx\", \"UVR-MDX-NET_Crowd_HQ_1.onnx\"]{allow-input: true}\n",
|
| 400 |
+
" #@markdown process all: processes all tracks inside tracks/ folder instead. (filename will be ignored!)\n",
|
| 401 |
+
" process_all = False # @param{type:\"boolean\"}\n",
|
| 402 |
+
"\n",
|
| 403 |
+
"\n",
|
| 404 |
+
" #@markdown ### Settings\n",
|
| 405 |
+
" #@markdown invert: get difference between input and output (e.g. get Instrumental out of a Vocal model, or the reverse)\n",
|
| 406 |
+
" invert = True # @param{type:\"boolean\"}\n",
|
| 407 |
+
" #@markdown denoise: get rid of MDX noise. (This processes input track twice)\n",
|
| 408 |
+
" denoise = True # @param{type:\"boolean\"}\n",
|
| 409 |
+
" #@markdown m_threads: like batch size, processes input wave in n threads. (beneficial for CPU)\n",
|
| 410 |
+
" m_threads = 2 #@param {type:\"slider\", min:1, max:8, step:1}\n",
|
| 411 |
+
"\n",
|
| 412 |
+
" #@markdown ### Custom model parameters (Only use this if you're using new/unofficial/custom models)\n",
|
| 413 |
+
" #@markdown Use custom model parameters. (Default: unchecked, or auto)\n",
|
| 414 |
+
" use_custom_parameter = False # @param{type:\"boolean\"}\n",
|
| 415 |
+
" #@markdown Output file suffix (usually the stem name e.g Vocals)\n",
|
| 416 |
+
" suffix = \"Vocals_custom\" #@param [\"Vocals\", \"Drums\", \"Bass\", \"Other\"]{allow-input: true}\n",
|
| 417 |
+
" suffix_invert = \"Instrumental_custom\" #@param [\"Instrumental\", \"Drumless\", \"Bassless\", \"Instruments\"]{allow-input: true}\n",
|
| 418 |
+
" #@markdown Model parameters\n",
|
| 419 |
+
" dim_f = 3072 #@param {type: \"integer\"}\n",
|
| 420 |
+
" dim_t = 256 #@param {type: \"integer\"}\n",
|
| 421 |
+
" n_fft = 6144 #@param {type: \"integer\"}\n",
|
| 422 |
+
" #@markdown use custom compensation: only if you have your own compensation value for your model. This still applies even if you don't have use_custom_parameter checked (Default: unchecked, or auto)\n",
|
| 423 |
+
" use_custom_compensation = False # @param{type:\"boolean\"}\n",
|
| 424 |
+
" compensation = 1.000 #@param {type: \"number\"}\n",
|
| 425 |
+
"\n",
|
| 426 |
+
" #@markdown ### Extras\n",
|
| 427 |
+
" #@markdown Deezer arl: paste your ARL here for Deezer tracks directly!\n",
|
| 428 |
+
" arl = \"\" #@param {type:\"string\"}\n",
|
| 429 |
+
" #@markdown Track format: select track quality/format\n",
|
| 430 |
+
" track_format = \"FLAC\" #@param [\"FLAC\",\"MP3_320\",\"MP3_128\"]\n",
|
| 431 |
+
" #@markdown Print settings being used in the run\n",
|
| 432 |
+
" print_settings = True # @param{type:\"boolean\"}\n",
|
| 433 |
+
"\n",
|
| 434 |
+
"\n",
|
| 435 |
+
"\n",
|
| 436 |
+
" onnx = id_to_ptm(onnx)\n",
|
| 437 |
+
" compensation = compensation if use_custom_compensation or use_custom_parameter else None\n",
|
| 438 |
+
" mdx_model = prepare_mdx(use_custom_parameter, dim_f, dim_t, n_fft, compensation=compensation)\n",
|
| 439 |
+
"\n",
|
| 440 |
+
" filename_split = filename.split(';')\n",
|
| 441 |
+
"\n",
|
| 442 |
+
" usable_files = []\n",
|
| 443 |
+
"\n",
|
| 444 |
+
" if not process_all:\n",
|
| 445 |
+
" for fn in filename_split:\n",
|
| 446 |
+
" fn = fn.strip()\n",
|
| 447 |
+
" if is_valid_url(fn):\n",
|
| 448 |
+
" dm, ltype, lid = deemix.parseLink(fn)\n",
|
| 449 |
+
" if ltype and lid:\n",
|
| 450 |
+
" usable_files += download_deezer(fn, arl, track_format)\n",
|
| 451 |
+
" else:\n",
|
| 452 |
+
" print('downloading link...',end=' ')\n",
|
| 453 |
+
" usable_files+=[download_link(fn)]\n",
|
| 454 |
+
" print('done')\n",
|
| 455 |
+
" else:\n",
|
| 456 |
+
" usable_files.append(os.path.join('tracks',fn))\n",
|
| 457 |
+
" else:\n",
|
| 458 |
+
" for fn in glob.glob('tracks/*'):\n",
|
| 459 |
+
" usable_files.append(fn)\n",
|
| 460 |
+
" for filename in usable_files:\n",
|
| 461 |
+
" suffix_naming = suffix if use_custom_parameter else None\n",
|
| 462 |
+
" diff_suffix_naming = suffix_invert if use_custom_parameter else None\n",
|
| 463 |
+
" run_mdx(onnx, mdx_model, filename, diff=invert,suffix=suffix_naming,diff_suffix=diff_suffix_naming,denoise=denoise)\n",
|
| 464 |
+
"\n",
|
| 465 |
+
" if print_settings:\n",
|
| 466 |
+
" print()\n",
|
| 467 |
+
" print('[MDX-Net_Colab settings used]')\n",
|
| 468 |
+
" print(f'Model used: {onnx}')\n",
|
| 469 |
+
" print(f'Model MD5: {mdx.MDX.get_hash(onnx)}')\n",
|
| 470 |
+
" print(f'Using de-noise: {denoise}')\n",
|
| 471 |
+
" print(f'Model parameters:')\n",
|
| 472 |
+
" print(f' -dim_f: {mdx_model.dim_f}')\n",
|
| 473 |
+
" print(f' -dim_t: {mdx_model.dim_t}')\n",
|
| 474 |
+
" print(f' -n_fft: {mdx_model.n_fft}')\n",
|
| 475 |
+
" print(f' -compensation: {mdx_model.compensation}')\n",
|
| 476 |
+
" print()\n",
|
| 477 |
+
" print('[Input file]')\n",
|
| 478 |
+
" print('filename(s): ')\n",
|
| 479 |
+
" for filename in usable_files:\n",
|
| 480 |
+
" print(f' -{filename}')\n",
|
| 481 |
+
"\n",
|
| 482 |
+
" del mdx_model"
|
| 483 |
+
]
|
| 484 |
+
},
|
| 485 |
+
{
|
| 486 |
+
"cell_type": "markdown",
|
| 487 |
+
"metadata": {
|
| 488 |
+
"id": "tMVwX5RhZSRP"
|
| 489 |
+
},
|
| 490 |
+
"source": [
|
| 491 |
+
"# Guide\n",
|
| 492 |
+
"\n",
|
| 493 |
+
"This tutorial guide will walk you through the steps to use the features of this Colab notebook.\n",
|
| 494 |
+
"\n",
|
| 495 |
+
"## Mount Drive\n",
|
| 496 |
+
"\n",
|
| 497 |
+
"To mount your Google Drive, follow these steps:\n",
|
| 498 |
+
"\n",
|
| 499 |
+
"1. Check the box next to \"MountDrive\" if you want to mount Google Drive.\n",
|
| 500 |
+
"2. Modify the \"mounting_path\" if you want to specify a different path for the drive to be mounted. **Note:** Be cautious when modifying this path as it can cause issues if not done properly.\n",
|
| 501 |
+
"3. Check the box next to \"Force update and disregard local changes\" if you want to discard all local modifications in your repository and replace the files with the versions from the original commit.\n",
|
| 502 |
+
"4. Check the box next to \"Auto Update\" if you want to automatically update without discarding your changes. Leave it unchecked if you want to manually update.\n",
|
| 503 |
+
"\n",
|
| 504 |
+
"## Input Files\n",
|
| 505 |
+
"\n",
|
| 506 |
+
"To upload your songs, follow these steps:\n",
|
| 507 |
+
"\n",
|
| 508 |
+
"1. Specify the \"track filename\" for your songs. You can provide multiple links or files by separating them with a semicolon (;).\n",
|
| 509 |
+
"2. Upload your songs to the \"tracks\" folder.\n",
|
| 510 |
+
"\n",
|
| 511 |
+
"## ONNX Model\n",
|
| 512 |
+
"\n",
|
| 513 |
+
"If you have your own ONNX model, follow these steps:\n",
|
| 514 |
+
"\n",
|
| 515 |
+
"1. Upload your model to the \"models\" folder.\n",
|
| 516 |
+
"2. Specify the \"onnx\" filename for your model.\n",
|
| 517 |
+
"\n",
|
| 518 |
+
"## Processing\n",
|
| 519 |
+
"\n",
|
| 520 |
+
"To process your tracks, follow these steps:\n",
|
| 521 |
+
"\n",
|
| 522 |
+
"1. If you want to process all tracks inside the \"tracks\" folder, check the box next to \"process_all\" and ignore the \"filename\" field.\n",
|
| 523 |
+
"2. Specify any additional settings you want:\n",
|
| 524 |
+
" - Check the box next to \"invert\" to get the difference between input and output (e.g., get Instrumental out of Vocals).\n",
|
| 525 |
+
" - Check the box next to \"denoise\" to get rid of MDX noise. This processes the input track twice.\n",
|
| 526 |
+
" - Specify custom model parameters only if you're using new/unofficial/custom models. Use the \"use_custom_parameter\" checkbox to enable this feature.\n",
|
| 527 |
+
" - Specify the output file suffix, which is usually the stem name (e.g., Vocals). Use the \"suffix\" field to specify the suffix for normal processing and the \"suffix_invert\" field for inverted processing.\n",
|
| 528 |
+
"\n",
|
| 529 |
+
"## Model Parameters\n",
|
| 530 |
+
"\n",
|
| 531 |
+
"Specify the following custom model parameters if applicable:\n",
|
| 532 |
+
"\n",
|
| 533 |
+
"- \"dim_f\": The value for the `dim_f` parameter.\n",
|
| 534 |
+
"- \"dim_t\": The value for the `dim_t` parameter.\n",
|
| 535 |
+
"- \"n_fft\": The value for the `n_fft` parameter.\n",
|
| 536 |
+
"- Check the box next to \"use_custom_compensation\" if you have your own compensation value for your model. Specify the compensation value in the \"compensation\" field.\n",
|
| 537 |
+
"\n",
|
| 538 |
+
"## Extras\n",
|
| 539 |
+
"\n",
|
| 540 |
+
"If you're working with Deezer tracks, paste your ARL (Authentication Request Library) in the \"arl\" field to directly access the tracks.\n",
|
| 541 |
+
"\n",
|
| 542 |
+
"Specify the \"Track format\" by selecting the desired quality/format for the track.\n",
|
| 543 |
+
"\n",
|
| 544 |
+
"To print the settings being used in the run, check the box next to \"print_settings\".\n",
|
| 545 |
+
"\n",
|
| 546 |
+
"That's it! You're now ready to use this Colab notebook. Enjoy!\n",
|
| 547 |
+
"\n",
|
| 548 |
+
"## For more detailed guide, proceed to this <a href=\"https://docs.google.com/document/d/17fjNvJzj8ZGSer7c7OFe_CNfUKbAxEh_OBv94ZdRG5c\">link</a>.\n",
|
| 549 |
+
"credits: (discord) deton24"
|
| 550 |
+
]
|
| 551 |
+
}
|
| 552 |
+
],
|
| 553 |
+
"metadata": {
|
| 554 |
+
"accelerator": "GPU",
|
| 555 |
+
"colab": {
|
| 556 |
+
"gpuType": "T4",
|
| 557 |
+
"provenance": []
|
| 558 |
+
},
|
| 559 |
+
"kernelspec": {
|
| 560 |
+
"display_name": "Python 3",
|
| 561 |
+
"name": "python3"
|
| 562 |
+
},
|
| 563 |
+
"language_info": {
|
| 564 |
+
"name": "python"
|
| 565 |
+
}
|
| 566 |
+
},
|
| 567 |
+
"nbformat": 4,
|
| 568 |
+
"nbformat_minor": 0
|
| 569 |
+
}
|
models/MDXCENTRE/.gitattributes
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
models/MDXCENTRE/config_mdx23c_similarity.yaml
ADDED
|
@@ -0,0 +1,89 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
audio:
|
| 2 |
+
chunk_size: 130560
|
| 3 |
+
dim_f: 1024
|
| 4 |
+
dim_t: 256
|
| 5 |
+
hop_length: 512
|
| 6 |
+
n_fft: 2048
|
| 7 |
+
num_channels: 2
|
| 8 |
+
sample_rate: 44100
|
| 9 |
+
min_mean_abs: 0.001
|
| 10 |
+
|
| 11 |
+
model:
|
| 12 |
+
act: gelu
|
| 13 |
+
bottleneck_factor: 4
|
| 14 |
+
growth: 128
|
| 15 |
+
norm: InstanceNorm
|
| 16 |
+
num_blocks_per_scale: 2
|
| 17 |
+
num_channels: 128
|
| 18 |
+
num_scales: 5
|
| 19 |
+
num_subbands: 4
|
| 20 |
+
scale:
|
| 21 |
+
- 2
|
| 22 |
+
- 2
|
| 23 |
+
|
| 24 |
+
training:
|
| 25 |
+
batch_size: 2
|
| 26 |
+
gradient_accumulation_steps: 3
|
| 27 |
+
grad_clip: 0
|
| 28 |
+
instruments:
|
| 29 |
+
- similarity
|
| 30 |
+
- difference
|
| 31 |
+
lr: 1.0
|
| 32 |
+
patience: 15
|
| 33 |
+
reduce_factor: 0.95
|
| 34 |
+
target_instrument: similarity
|
| 35 |
+
num_epochs: 1000
|
| 36 |
+
num_steps: 2235
|
| 37 |
+
q: 0.95
|
| 38 |
+
coarse_loss_clip: true
|
| 39 |
+
ema_momentum: 0.999
|
| 40 |
+
optimizer: prodigy
|
| 41 |
+
other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
|
| 42 |
+
use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
|
| 43 |
+
|
| 44 |
+
augmentations:
|
| 45 |
+
enable: true # enable or disable all augmentations (a quick way to turn them all off if needed)
|
| 46 |
+
loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
|
| 47 |
+
loudness_min: 0.5
|
| 48 |
+
loudness_max: 1.5
|
| 49 |
+
|
| 50 |
+
all:
|
| 51 |
+
channel_shuffle: 0.5 # Set 0 or lower to disable
|
| 52 |
+
random_inverse: 0.01 # inverse track (a low probability is recommended)
|
| 53 |
+
random_polarity: 0.5 # polarity change (multiply waveform by -1)
|
| 54 |
+
mp3_compression: 0.0
|
| 55 |
+
mp3_compression_min_bitrate: 32
|
| 56 |
+
mp3_compression_max_bitrate: 320
|
| 57 |
+
mp3_compression_backend: "lameenc"
|
| 58 |
+
pitch_shift: 0.1
|
| 59 |
+
pitch_shift_min_semitones: -3
|
| 60 |
+
pitch_shift_max_semitones: 3
|
| 61 |
+
seven_band_parametric_eq: 0.5
|
| 62 |
+
seven_band_parametric_eq_min_gain_db: -6
|
| 63 |
+
seven_band_parametric_eq_max_gain_db: 6
|
| 64 |
+
tanh_distortion: 0.2
|
| 65 |
+
tanh_distortion_min: 0.1
|
| 66 |
+
tanh_distortion_max: 0.5
|
| 67 |
+
|
| 68 |
+
similarity:
|
| 69 |
+
gaussian_noise: 0.1
|
| 70 |
+
gaussian_noise_min_amplitude: 0.001
|
| 71 |
+
gaussian_noise_max_amplitude: 0.015
|
| 72 |
+
|
| 73 |
+
difference:
|
| 74 |
+
pedalboard_reverb: 0.01
|
| 75 |
+
pedalboard_reverb_room_size_min: 0.1
|
| 76 |
+
pedalboard_reverb_room_size_max: 0.9
|
| 77 |
+
pedalboard_reverb_damping_min: 0.1
|
| 78 |
+
pedalboard_reverb_damping_max: 0.9
|
| 79 |
+
pedalboard_reverb_wet_level_min: 0.1
|
| 80 |
+
pedalboard_reverb_wet_level_max: 0.5
|
| 81 |
+
pedalboard_reverb_dry_level_min: 0.5
|
| 82 |
+
pedalboard_reverb_dry_level_max: 0.9
|
| 83 |
+
pedalboard_reverb_width_min: 0.3
|
| 84 |
+
pedalboard_reverb_width_max: 1.0
|
| 85 |
+
|
| 86 |
+
inference:
|
| 87 |
+
batch_size: 1
|
| 88 |
+
dim_t: 256
|
| 89 |
+
num_overlap: 8
|
models/MDXCENTRE/model_mdx23c_ep_237_l1_freq_71.9982.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf55a7b0f9cc802a560bd18c604ead29f778cc804867faa1cf92bb0f7a877fa4
|
| 3 |
+
size 437613512
|
models/MDXCENTRE/source.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://huggingface.co/thexstyx/MDXCENTRE
|
models/UVR5-MDX-NET-VIP-MODELS/.gitattributes
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
models/UVR5-MDX-NET-VIP-MODELS/MDX23C-8KFFT-InstVoc_HQ_2.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d960d8e40a458120412c1bd807e013d2dbca7b959cc9da2bbcb0eb203d1daea
|
| 3 |
+
size 448093770
|
models/UVR5-MDX-NET-VIP-MODELS/README.md
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
license: openrail
|
| 3 |
+
---
|
models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET-Inst_full_292.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:020f6b65fa219fb7c285e4f3fc2863bf22daf03c4c93e547b6d13d5f2757a7ec
|
| 3 |
+
size 66759214
|
models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Inst_187_beta.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c74566f3c3033cacba996328b2ee90bf77ef79ea6c35b7841df183b7906f54a5
|
| 3 |
+
size 66759214
|
models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Inst_82_beta.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c6c268302f09ab53687072618e056a611272a7e2c3fd9b3b59164da152f3588e
|
| 3 |
+
size 66759214
|
models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Inst_90_beta.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d902868a46575aea6ee2335736ff3b53faf497a6bdaa1b864e0fd84eb1b42a5
|
| 3 |
+
size 66759214
|
models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Main_340.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78792633b4007755af12ecde20f709b4f0b99563b1d25fe0a501ed2122aff218
|
| 3 |
+
size 66759214
|
models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Main_390.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:286c4f0847ca837e2c3f4c4058f756d5f150cbf080506aa6f33a2847aba92e8c
|
| 3 |
+
size 66759214
|
models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Main_406.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f158816a44eef1f0ba0f48b813cbfcf460ed1c70a754af3609ade44aaf7d1b23
|
| 3 |
+
size 66759214
|
models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Main_427.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95275802a27801b97e3c0552b6eaa69f9bb3bd7df53cdf0536cce0a753f702cc
|
| 3 |
+
size 66759214
|
models/UVR5-MDX-NET-VIP-MODELS/UVR-MDX-NET_Main_438.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5e1ad93587a163a0987a0168b99a2ad875c0d9bfc3afb596b7c36b09c7f5c26
|
| 3 |
+
size 66759214
|
models/UVR5-MDX-NET-VIP-MODELS/source.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://huggingface.co/Eddycrack864/UVR5-MDX-NET-VIP-MODELS
|
models/aufr33_jarredou_MDXv3_DeReverb/.gitattributes
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
models/aufr33_jarredou_MDXv3_DeReverb/config_dereverb_mdx23c.yaml
ADDED
|
@@ -0,0 +1,135 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
audio:
|
| 2 |
+
chunk_size: 261120
|
| 3 |
+
dim_f: 4096
|
| 4 |
+
dim_t: 256
|
| 5 |
+
hop_length: 1024
|
| 6 |
+
n_fft: 8192
|
| 7 |
+
num_channels: 2
|
| 8 |
+
sample_rate: 44100
|
| 9 |
+
min_mean_abs: 0.001
|
| 10 |
+
|
| 11 |
+
model:
|
| 12 |
+
act: gelu
|
| 13 |
+
bottleneck_factor: 4
|
| 14 |
+
growth: 128
|
| 15 |
+
norm: InstanceNorm
|
| 16 |
+
num_blocks_per_scale: 2
|
| 17 |
+
num_channels: 128
|
| 18 |
+
num_scales: 5
|
| 19 |
+
num_subbands: 4
|
| 20 |
+
scale:
|
| 21 |
+
- 2
|
| 22 |
+
- 2
|
| 23 |
+
|
| 24 |
+
training:
|
| 25 |
+
batch_size: 2
|
| 26 |
+
gradient_accumulation_steps: 1
|
| 27 |
+
grad_clip: 0
|
| 28 |
+
instruments:
|
| 29 |
+
- dry
|
| 30 |
+
- other
|
| 31 |
+
lr: 1.0e-06
|
| 32 |
+
patience: 4
|
| 33 |
+
reduce_factor: 0.93
|
| 34 |
+
target_instrument: null
|
| 35 |
+
num_epochs: 40
|
| 36 |
+
num_steps: 1000
|
| 37 |
+
q: 0.95
|
| 38 |
+
coarse_loss_clip: true
|
| 39 |
+
ema_momentum: 0.999
|
| 40 |
+
optimizer: adamw
|
| 41 |
+
read_metadata_procs: 8 # Number of processes to use during metadata reading for dataset. Can speed up metadata generation
|
| 42 |
+
other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
|
| 43 |
+
use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
|
| 44 |
+
|
| 45 |
+
augmentations:
|
| 46 |
+
enable: false # enable or disable all augmentations (a quick way to turn them all off if needed)
|
| 47 |
+
loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
|
| 48 |
+
loudness_min: 0.5
|
| 49 |
+
loudness_max: 1.5
|
| 50 |
+
mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
|
| 51 |
+
mixup_probs: !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
|
| 52 |
+
- 0.2
|
| 53 |
+
- 0.02
|
| 54 |
+
mixup_loudness_min: 0.5
|
| 55 |
+
mixup_loudness_max: 1.5
|
| 56 |
+
|
| 57 |
+
all:
|
| 58 |
+
channel_shuffle: 0.5 # Set 0 or lower to disable
|
| 59 |
+
random_inverse: 0.05 # inverse track (a low probability is recommended)
|
| 60 |
+
random_polarity: 0.5 # polarity change (multiply waveform by -1)
|
| 61 |
+
|
| 62 |
+
# pedalboard chorus block
|
| 63 |
+
pedalboard_chorus: 0.001
|
| 64 |
+
pedalboard_chorus_rate_hz_min: 1.0
|
| 65 |
+
pedalboard_chorus_rate_hz_max: 7.0
|
| 66 |
+
pedalboard_chorus_depth_min: 0.25
|
| 67 |
+
pedalboard_chorus_depth_max: 0.95
|
| 68 |
+
pedalboard_chorus_centre_delay_ms_min: 3
|
| 69 |
+
pedalboard_chorus_centre_delay_ms_max: 10
|
| 70 |
+
pedalboard_chorus_feedback_min: 0.0
|
| 71 |
+
pedalboard_chorus_feedback_max: 0.01
|
| 72 |
+
pedalboard_chorus_mix_min: 0.1
|
| 73 |
+
pedalboard_chorus_mix_max: 0.9
|
| 74 |
+
|
| 75 |
+
# pedalboard phazer block
|
| 76 |
+
pedalboard_phazer: 0.001
|
| 77 |
+
pedalboard_phazer_rate_hz_min: 1.0
|
| 78 |
+
pedalboard_phazer_rate_hz_max: 10.0
|
| 79 |
+
pedalboard_phazer_depth_min: 0.25
|
| 80 |
+
pedalboard_phazer_depth_max: 0.95
|
| 81 |
+
pedalboard_phazer_centre_frequency_hz_min: 200
|
| 82 |
+
pedalboard_phazer_centre_frequency_hz_max: 12000
|
| 83 |
+
pedalboard_phazer_feedback_min: 0.0
|
| 84 |
+
pedalboard_phazer_feedback_max: 0.5
|
| 85 |
+
pedalboard_phazer_mix_min: 0.1
|
| 86 |
+
pedalboard_phazer_mix_max: 0.9
|
| 87 |
+
|
| 88 |
+
# pedalboard pitch shift block
|
| 89 |
+
pedalboard_pitch_shift: 0.01
|
| 90 |
+
pedalboard_pitch_shift_semitones_min: -7
|
| 91 |
+
pedalboard_pitch_shift_semitones_max: 7
|
| 92 |
+
|
| 93 |
+
# pedalboard resample block
|
| 94 |
+
pedalboard_resample: 0.001
|
| 95 |
+
pedalboard_resample_target_sample_rate_min: 4000
|
| 96 |
+
pedalboard_resample_target_sample_rate_max: 44100
|
| 97 |
+
|
| 98 |
+
mp3_compression_min_bitrate: 32
|
| 99 |
+
mp3_compression_max_bitrate: 320
|
| 100 |
+
mp3_compression_backend: "lameenc"
|
| 101 |
+
|
| 102 |
+
dry:
|
| 103 |
+
# pedalboard distortion block
|
| 104 |
+
pedalboard_distortion: 0.001
|
| 105 |
+
pedalboard_distortion_drive_db_min: 1.0
|
| 106 |
+
pedalboard_distortion_drive_db_max: 25.0
|
| 107 |
+
|
| 108 |
+
tanh_distortion: 0.05
|
| 109 |
+
tanh_distortion_min: 0.1
|
| 110 |
+
tanh_distortion_max: 0.7
|
| 111 |
+
# pedalboard bitcrash block
|
| 112 |
+
pedalboard_bitcrash: 0.005
|
| 113 |
+
pedalboard_bitcrash_bit_depth_min: 4
|
| 114 |
+
pedalboard_bitcrash_bit_depth_max: 16
|
| 115 |
+
|
| 116 |
+
seven_band_parametric_eq: 0.24
|
| 117 |
+
seven_band_parametric_eq_min_gain_db: -9
|
| 118 |
+
seven_band_parametric_eq_max_gain_db: 9
|
| 119 |
+
|
| 120 |
+
gaussian_noise: 0.005
|
| 121 |
+
gaussian_noise_min_amplitude: 0.001
|
| 122 |
+
gaussian_noise_max_amplitude: 0.01
|
| 123 |
+
|
| 124 |
+
time_stretch: 0.01
|
| 125 |
+
time_stretch_min_rate: 0.8
|
| 126 |
+
time_stretch_max_rate: 1.25
|
| 127 |
+
other:
|
| 128 |
+
seven_band_parametric_eq: 0.24
|
| 129 |
+
seven_band_parametric_eq_min_gain_db: -9
|
| 130 |
+
seven_band_parametric_eq_max_gain_db: 9
|
| 131 |
+
|
| 132 |
+
inference:
|
| 133 |
+
batch_size: 2
|
| 134 |
+
dim_t: 256
|
| 135 |
+
num_overlap: 4
|
models/aufr33_jarredou_MDXv3_DeReverb/dereverb_mdx23c_sdr_6.9096.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eae2471b707758d74db38ac1b1d5800e12f57c4e9d1ebbb2faf004b8e086e914
|
| 3 |
+
size 448098867
|
models/aufr33_jarredou_MDXv3_DeReverb/source.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://huggingface.co/jarredou/aufr33_jarredou_MDXv3_DeReverb
|
models/mdxnet/.gitattributes
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
models/mdxnet/README.md
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
license: mit
|
| 3 |
+
---
|
| 4 |
+
|
| 5 |
+
Sources:
|
| 6 |
+
1. Originally trained by KUIELAB. KUIELAB-MDX-Net took 2nd place on Leaderboard A and 3rd place on Leaderboard B in the MDX Challenge at ISMIR 2021. MIT license, [link](https://github.com/kuielab/mdx-net)
|
| 7 |
+
2. Used by Project ultimatevocalremovergui, MIT license, [link](https://github.com/Anjok07/ultimatevocalremovergui)
|
| 8 |
+
3. Used by Project Ultimate Vocal Remover CLI, [link](https://github.com/seanghay/uvr)
|
models/mdxnet/UVR-MDX-NET-Inst_HQ_3.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:317554b07fe1ea5279a77f2b1520a41ea4b93432560c4ffd08792c30fddf9adc
|
| 3 |
+
size 66759214
|
models/mdxnet/UVR-MDX-NET-Voc_FT.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:534b2070fcc7df514b13ef660dc8cbb328679c2374d04354a5c42bb14ecce111
|
| 3 |
+
size 66762490
|
models/mdxnet/UVR_MDXNET_KARA_2.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf32e15105a09c0f7dddd2b67346146334d6f3ecb399ed7638eba2ab07cbf5f4
|
| 3 |
+
size 52786726
|
models/mdxnet/model_data.json
ADDED
|
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"77d07b2667ddf05b9e3175941b4454a0": {
|
| 3 |
+
"compensate": 1.021,
|
| 4 |
+
"mdx_dim_f_set": 3072,
|
| 5 |
+
"mdx_dim_t_set": 8,
|
| 6 |
+
"mdx_n_fft_scale_set": 7680,
|
| 7 |
+
"primary_stem": "Vocals",
|
| 8 |
+
"name": "UVR-MDX-NET-Voc_FT.onnx"
|
| 9 |
+
},
|
| 10 |
+
"1d64a6d2c30f709b8c9b4ce1366d96ee": {
|
| 11 |
+
"compensate": 1.035,
|
| 12 |
+
"mdx_dim_f_set": 2048,
|
| 13 |
+
"mdx_dim_t_set": 8,
|
| 14 |
+
"mdx_n_fft_scale_set": 5120,
|
| 15 |
+
"primary_stem": "Instrumental",
|
| 16 |
+
"name": "UVR_MDXNET_KARA_2.onnx"
|
| 17 |
+
},
|
| 18 |
+
"cd5b2989ad863f116c855db1dfe24e39": {
|
| 19 |
+
"compensate": 1.035,
|
| 20 |
+
"mdx_dim_f_set": 3072,
|
| 21 |
+
"mdx_dim_t_set": 9,
|
| 22 |
+
"mdx_n_fft_scale_set": 6144,
|
| 23 |
+
"primary_stem": "Other",
|
| 24 |
+
"name": "Reverb_HQ_By_FoxJoy.onnx"
|
| 25 |
+
},
|
| 26 |
+
"55657dd70583b0fedfba5f67df11d711": {
|
| 27 |
+
"compensate": 1.022,
|
| 28 |
+
"mdx_dim_f_set": 3072,
|
| 29 |
+
"mdx_dim_t_set": 8,
|
| 30 |
+
"mdx_n_fft_scale_set": 6144,
|
| 31 |
+
"primary_stem": "Instrumental",
|
| 32 |
+
"name": "UVR-MDX-NET-Inst_HQ_3.onnx"
|
| 33 |
+
},
|
| 34 |
+
"cc63408db3d80b4d85b0287d1d7c9632": {
|
| 35 |
+
"compensate": 1.033,
|
| 36 |
+
"mdx_dim_f_set": 3072,
|
| 37 |
+
"mdx_dim_t_set": 8,
|
| 38 |
+
"mdx_n_fft_scale_set": 6144,
|
| 39 |
+
"primary_stem": "Instrumental",
|
| 40 |
+
"name": "UVR-MDX-NET-Inst_HQ_2.onnx"
|
| 41 |
+
},
|
| 42 |
+
"0f2a6bc5b49d87d64728ee40e23bceb1": {
|
| 43 |
+
"compensate": 1.022,
|
| 44 |
+
"mdx_dim_f_set": 3072,
|
| 45 |
+
"mdx_dim_t_set": 8,
|
| 46 |
+
"mdx_n_fft_scale_set": 6144,
|
| 47 |
+
"primary_stem": "Instrumental",
|
| 48 |
+
"name": "UVR-MDX-NET-Inst_HQ_4.onnx"
|
| 49 |
+
}
|
| 50 |
+
}
|
models/mdxnet/source.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://huggingface.co/masszhou/mdxnet
|