Немножко изменил список зависимостей и добавил ячейку для просмотра списка установленных моделей в Vbach
Browse files- MVSepLess_Epsilon_Colab.ipynb +54 -44
MVSepLess_Epsilon_Colab.ipynb
CHANGED
|
@@ -18,63 +18,59 @@
|
|
| 18 |
"%cd $home_dir\n",
|
| 19 |
"!git clone $repo_url $mvsepless_dir\n",
|
| 20 |
"%cd $mvsepless_dir\n",
|
| 21 |
-
"!pip install uv\n",
|
| 22 |
"req = \"\"\"\n",
|
| 23 |
-
"torch
|
| 24 |
-
"torchvision
|
| 25 |
-
"torchaudio
|
| 26 |
"numpy==2.0.2\n",
|
| 27 |
"pandas\n",
|
| 28 |
-
"scipy
|
| 29 |
-
"librosa
|
| 30 |
"samplerate==0.1.0\n",
|
| 31 |
"matplotlib\n",
|
| 32 |
-
"tqdm
|
| 33 |
-
"einops
|
| 34 |
-
"protobuf
|
| 35 |
-
"soundfile
|
| 36 |
-
"pydub
|
| 37 |
-
"webrtcvad
|
| 38 |
-
"audiomentations
|
| 39 |
"pedalboard==0.8.2\n",
|
| 40 |
-
"
|
| 41 |
-
"
|
| 42 |
-
"
|
| 43 |
-
"
|
| 44 |
-
"
|
| 45 |
-
"
|
| 46 |
-
"
|
| 47 |
-
"
|
| 48 |
-
"
|
| 49 |
-
"segmentation_models_pytorch==0.5.0\n",
|
| 50 |
-
"torchseg==0.0.1a4\n",
|
| 51 |
"demucs==4.0.0\n",
|
| 52 |
-
"asteroid
|
| 53 |
-
"prodigyopt
|
| 54 |
-
"torch_log_wmse
|
| 55 |
-
"rotary_embedding_torch
|
| 56 |
"gradio\n",
|
| 57 |
-
"omegaconf
|
| 58 |
-
"beartype
|
| 59 |
-
"spafe
|
| 60 |
-
"torch_audiomentations
|
| 61 |
-
"auraloss
|
| 62 |
"onnx>=1.17\n",
|
| 63 |
"onnx2torch>=0.3.0\n",
|
| 64 |
"onnxruntime-gpu>=1.17\n",
|
| 65 |
-
"ml_dtypes
|
| 66 |
"resampy\n",
|
| 67 |
"yt_dlp\n",
|
| 68 |
-
"python-magic\n",
|
| 69 |
"pyngrok\n",
|
| 70 |
"tabulate\n",
|
| 71 |
-
"gradio_modal\n",
|
| 72 |
"neuraloperator==1.0.2\n",
|
| 73 |
-
"torchcrepe
|
| 74 |
-
"praat-parselmouth
|
| 75 |
"faiss-cpu==1.11\n",
|
| 76 |
-
"local-attention
|
| 77 |
-
"tenacity
|
| 78 |
"pyworld\n",
|
| 79 |
"gdown\n",
|
| 80 |
"\"\"\"\n",
|
|
@@ -147,7 +143,7 @@
|
|
| 147 |
"\n",
|
| 148 |
"input_url = \"\" # @param {\"type\":\"string\",\"placeholder\":\"Ссылка на аудио/видео\"}\n",
|
| 149 |
"output_dir = \"/content/downloaded\" # @param {\"type\":\"string\",\"placeholder\":\"Директория для сохранения скачанного аудио\"}\n",
|
| 150 |
-
"cookies_path = \"\" # @param {\"type\":\"string\",\"placeholder\":\"Путь к cookies (д
|
| 151 |
"downloaded_file = dw_yt_dlp(url=input_url, output_dir=output_dir, cookie=cookies_path)\n"
|
| 152 |
],
|
| 153 |
"metadata": {
|
|
@@ -329,7 +325,7 @@
|
|
| 329 |
"#@markdown ---\n",
|
| 330 |
"#@markdown ### Входные данные\n",
|
| 331 |
"#@markdown * Путь к входной папке/файлу:\n",
|
| 332 |
-
"input_path = \"\" # @param {\"type\":\"string\",\"placeholder\":\"/путь/к/файлу\"}\n",
|
| 333 |
"#@markdown ---\n",
|
| 334 |
"#@markdown ### Выбор модели\n",
|
| 335 |
"#@markdown * Тип / Имя модели:\n",
|
|
@@ -385,6 +381,20 @@
|
|
| 385 |
"id": "H24RtVB1YlE0"
|
| 386 |
}
|
| 387 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 388 |
{
|
| 389 |
"cell_type": "markdown",
|
| 390 |
"source": [
|
|
@@ -475,7 +485,7 @@
|
|
| 475 |
"# @markdown ---\n",
|
| 476 |
"# @markdown ### Hubert\n",
|
| 477 |
"# @markdown * Стэк\n",
|
| 478 |
-
"stack = \"
|
| 479 |
"# @markdown * Имя модели для fairseq\n",
|
| 480 |
"fairseq_embedder = \"hubert_base\" # @param [\"hubert_base\",\"contentvec_base\",\"korean_hubert_base\",\"chinese_hubert_base\",\"portuguese_hubert_base\",\"japanese_hubert_base\"]\n",
|
| 481 |
"# @markdown * Имя модели для transformers\n",
|
|
@@ -483,7 +493,7 @@
|
|
| 483 |
"# @markdown ---\n",
|
| 484 |
"# @markdown ### Настройки преобразования\n",
|
| 485 |
"# @markdown * Влияние индекса\n",
|
| 486 |
-
"index_rate =
|
| 487 |
"# @markdown * Стерео режим\n",
|
| 488 |
"stereo_mode = \"mono\" # @param [\"mono\",\"left/right\",\"sim/dif\"]\n",
|
| 489 |
"# @markdown * Метод определения тона\n",
|
|
|
|
| 18 |
"%cd $home_dir\n",
|
| 19 |
"!git clone $repo_url $mvsepless_dir\n",
|
| 20 |
"%cd $mvsepless_dir\n",
|
| 21 |
+
"!pip install --no-cache-dir uv\n",
|
| 22 |
"req = \"\"\"\n",
|
| 23 |
+
"torch\n",
|
| 24 |
+
"torchvision\n",
|
| 25 |
+
"torchaudio\n",
|
| 26 |
"numpy==2.0.2\n",
|
| 27 |
"pandas\n",
|
| 28 |
+
"scipy\n",
|
| 29 |
+
"librosa\n",
|
| 30 |
"samplerate==0.1.0\n",
|
| 31 |
"matplotlib\n",
|
| 32 |
+
"tqdm\n",
|
| 33 |
+
"einops\n",
|
| 34 |
+
"protobuf\n",
|
| 35 |
+
"soundfile\n",
|
| 36 |
+
"pydub\n",
|
| 37 |
+
"webrtcvad\n",
|
| 38 |
+
"audiomentations\n",
|
| 39 |
"pedalboard==0.8.2\n",
|
| 40 |
+
"ml_collections\n",
|
| 41 |
+
"timm\n",
|
| 42 |
+
"wandb\n",
|
| 43 |
+
"accelerate\n",
|
| 44 |
+
"bitsandbytes\n",
|
| 45 |
+
"tokenizers\n",
|
| 46 |
+
"huggingface-hub\n",
|
| 47 |
+
"transformers\n",
|
| 48 |
+
"torchseg\n",
|
|
|
|
|
|
|
| 49 |
"demucs==4.0.0\n",
|
| 50 |
+
"asteroid\n",
|
| 51 |
+
"prodigyopt\n",
|
| 52 |
+
"torch_log_wmse\n",
|
| 53 |
+
"rotary_embedding_torch\n",
|
| 54 |
"gradio\n",
|
| 55 |
+
"omegaconf\n",
|
| 56 |
+
"beartype\n",
|
| 57 |
+
"spafe\n",
|
| 58 |
+
"torch_audiomentations\n",
|
| 59 |
+
"auraloss\n",
|
| 60 |
"onnx>=1.17\n",
|
| 61 |
"onnx2torch>=0.3.0\n",
|
| 62 |
"onnxruntime-gpu>=1.17\n",
|
| 63 |
+
"ml_dtypes\n",
|
| 64 |
"resampy\n",
|
| 65 |
"yt_dlp\n",
|
|
|
|
| 66 |
"pyngrok\n",
|
| 67 |
"tabulate\n",
|
|
|
|
| 68 |
"neuraloperator==1.0.2\n",
|
| 69 |
+
"torchcrepe\n",
|
| 70 |
+
"praat-parselmouth\n",
|
| 71 |
"faiss-cpu==1.11\n",
|
| 72 |
+
"local-attention\n",
|
| 73 |
+
"tenacity\n",
|
| 74 |
"pyworld\n",
|
| 75 |
"gdown\n",
|
| 76 |
"\"\"\"\n",
|
|
|
|
| 143 |
"\n",
|
| 144 |
"input_url = \"\" # @param {\"type\":\"string\",\"placeholder\":\"Ссылка на аудио/видео\"}\n",
|
| 145 |
"output_dir = \"/content/downloaded\" # @param {\"type\":\"string\",\"placeholder\":\"Директория для сохранения скачанного аудио\"}\n",
|
| 146 |
+
"cookies_path = \"\" # @param {\"type\":\"string\",\"placeholder\":\"Путь к cookies (для успешного скачивания с ютуба)\"}\n",
|
| 147 |
"downloaded_file = dw_yt_dlp(url=input_url, output_dir=output_dir, cookie=cookies_path)\n"
|
| 148 |
],
|
| 149 |
"metadata": {
|
|
|
|
| 325 |
"#@markdown ---\n",
|
| 326 |
"#@markdown ### Входные данные\n",
|
| 327 |
"#@markdown * Путь к входной папке/файлу:\n",
|
| 328 |
+
"input_path = \"/content/musicboxtntblits_128kbit.mp3\" # @param {\"type\":\"string\",\"placeholder\":\"/путь/к/файлу\"}\n",
|
| 329 |
"#@markdown ---\n",
|
| 330 |
"#@markdown ### Выбор модели\n",
|
| 331 |
"#@markdown * Тип / Имя модели:\n",
|
|
|
|
| 381 |
"id": "H24RtVB1YlE0"
|
| 382 |
}
|
| 383 |
},
|
| 384 |
+
{
|
| 385 |
+
"cell_type": "code",
|
| 386 |
+
"execution_count": null,
|
| 387 |
+
"metadata": {
|
| 388 |
+
"cellView": "form",
|
| 389 |
+
"id": "JGme2oZOf_W3"
|
| 390 |
+
},
|
| 391 |
+
"outputs": [],
|
| 392 |
+
"source": [
|
| 393 |
+
"#@title Показать список установленных моделей для преобразования\n",
|
| 394 |
+
"%cd $mvsepless_dir\n",
|
| 395 |
+
"!python mvsepless/model_manager.py vbach list"
|
| 396 |
+
]
|
| 397 |
+
},
|
| 398 |
{
|
| 399 |
"cell_type": "markdown",
|
| 400 |
"source": [
|
|
|
|
| 485 |
"# @markdown ---\n",
|
| 486 |
"# @markdown ### Hubert\n",
|
| 487 |
"# @markdown * Стэк\n",
|
| 488 |
+
"stack = \"transformers\" # @param [\"fairseq\",\"transformers\"]\n",
|
| 489 |
"# @markdown * Имя модели для fairseq\n",
|
| 490 |
"fairseq_embedder = \"hubert_base\" # @param [\"hubert_base\",\"contentvec_base\",\"korean_hubert_base\",\"chinese_hubert_base\",\"portuguese_hubert_base\",\"japanese_hubert_base\"]\n",
|
| 491 |
"# @markdown * Имя модели для transformers\n",
|
|
|
|
| 493 |
"# @markdown ---\n",
|
| 494 |
"# @markdown ### Настройки преобразования\n",
|
| 495 |
"# @markdown * Влияние индекса\n",
|
| 496 |
+
"index_rate = 1 # @param {\"type\":\"slider\",\"min\":0,\"max\":1,\"step\":0.01}\n",
|
| 497 |
"# @markdown * Стерео режим\n",
|
| 498 |
"stereo_mode = \"mono\" # @param [\"mono\",\"left/right\",\"sim/dif\"]\n",
|
| 499 |
"# @markdown * Метод определения тона\n",
|