noblebarkrr committed on
Commit
80c40b6
·
verified ·
1 Parent(s): 6e99539

Немножко изменил список зависимостей и добавил ячейку для просмотра списка установленных моделей в Vbach

Browse files
Files changed (1) hide show
  1. MVSepLess_Epsilon_Colab.ipynb +54 -44
MVSepLess_Epsilon_Colab.ipynb CHANGED
@@ -18,63 +18,59 @@
18
  "%cd $home_dir\n",
19
  "!git clone $repo_url $mvsepless_dir\n",
20
  "%cd $mvsepless_dir\n",
21
- "!pip install uv\n",
22
  "req = \"\"\"\n",
23
- "torch==2.9.0\n",
24
- "torchvision==0.24.0\n",
25
- "torchaudio==2.9.0\n",
26
  "numpy==2.0.2\n",
27
  "pandas\n",
28
- "scipy==1.16.3\n",
29
- "librosa==0.11.0\n",
30
  "samplerate==0.1.0\n",
31
  "matplotlib\n",
32
- "tqdm==4.67.1\n",
33
- "einops==0.8.1\n",
34
- "protobuf==5.29.5\n",
35
- "soundfile==0.13.1\n",
36
- "pydub==0.25.1\n",
37
- "webrtcvad==2.0.10\n",
38
- "audiomentations==0.42.0\n",
39
  "pedalboard==0.8.2\n",
40
- "ffmpeg-python==0.2.0\n",
41
- "ml_collections==1.1.0\n",
42
- "timm==1.0.22\n",
43
- "wandb==0.23.0\n",
44
- "accelerate==1.12.0\n",
45
- "bitsandbytes==0.46.0\n",
46
- "tokenizers==0.22.1\n",
47
- "huggingface-hub==0.36.0\n",
48
- "transformers==4.57.2\n",
49
- "segmentation_models_pytorch==0.5.0\n",
50
- "torchseg==0.0.1a4\n",
51
  "demucs==4.0.0\n",
52
- "asteroid==0.7.0\n",
53
- "prodigyopt==1.1.2\n",
54
- "torch_log_wmse==0.3.0\n",
55
- "rotary_embedding_torch==0.6.5\n",
56
  "gradio\n",
57
- "omegaconf==2.3.0\n",
58
- "beartype==0.22.6\n",
59
- "spafe==0.3.2\n",
60
- "torch_audiomentations==0.12.0\n",
61
- "auraloss==0.4.0\n",
62
  "onnx>=1.17\n",
63
  "onnx2torch>=0.3.0\n",
64
  "onnxruntime-gpu>=1.17\n",
65
- "ml_dtypes==0.5.4\n",
66
  "resampy\n",
67
  "yt_dlp\n",
68
- "python-magic\n",
69
  "pyngrok\n",
70
  "tabulate\n",
71
- "gradio_modal\n",
72
  "neuraloperator==1.0.2\n",
73
- "torchcrepe==0.0.23\n",
74
- "praat-parselmouth==0.4.5\n",
75
  "faiss-cpu==1.11\n",
76
- "local-attention==1.11.1\n",
77
- "tenacity==9.1.2\n",
78
  "pyworld\n",
79
  "gdown\n",
80
  "\"\"\"\n",
@@ -147,7 +143,7 @@
147
  "\n",
148
  "input_url = \"\" # @param {\"type\":\"string\",\"placeholder\":\"Ссылка на аудио/видео\"}\n",
149
  "output_dir = \"/content/downloaded\" # @param {\"type\":\"string\",\"placeholder\":\"Директория для сохранения скачанного аудио\"}\n",
150
- "cookies_path = \"\" # @param {\"type\":\"string\",\"placeholder\":\"Путь к cookies (дял успешного скачивания с ютуба)\"}\n",
151
  "downloaded_file = dw_yt_dlp(url=input_url, output_dir=output_dir, cookie=cookies_path)\n"
152
  ],
153
  "metadata": {
@@ -329,7 +325,7 @@
329
  "#@markdown ---\n",
330
  "#@markdown ### Входные данные\n",
331
  "#@markdown * Путь к входной папке/файлу:\n",
332
- "input_path = \"\" # @param {\"type\":\"string\",\"placeholder\":\"/путь/к/файлу\"}\n",
333
  "#@markdown ---\n",
334
  "#@markdown ### Выбор модели\n",
335
  "#@markdown * Тип / Имя модели:\n",
@@ -385,6 +381,20 @@
385
  "id": "H24RtVB1YlE0"
386
  }
387
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
388
  {
389
  "cell_type": "markdown",
390
  "source": [
@@ -475,7 +485,7 @@
475
  "# @markdown ---\n",
476
  "# @markdown ### Hubert\n",
477
  "# @markdown * Стэк\n",
478
- "stack = \"fairseq\" # @param [\"fairseq\",\"transformers\"]\n",
479
  "# @markdown * Имя модели для fairseq\n",
480
  "fairseq_embedder = \"hubert_base\" # @param [\"hubert_base\",\"contentvec_base\",\"korean_hubert_base\",\"chinese_hubert_base\",\"portuguese_hubert_base\",\"japanese_hubert_base\"]\n",
481
  "# @markdown * Имя модели для transformers\n",
@@ -483,7 +493,7 @@
483
  "# @markdown ---\n",
484
  "# @markdown ### Настройки преобразования\n",
485
  "# @markdown * Влияние индекса\n",
486
- "index_rate = 0 # @param {\"type\":\"slider\",\"min\":0,\"max\":1,\"step\":0.01}\n",
487
  "# @markdown * Стерео режим\n",
488
  "stereo_mode = \"mono\" # @param [\"mono\",\"left/right\",\"sim/dif\"]\n",
489
  "# @markdown * Метод определения тона\n",
 
18
  "%cd $home_dir\n",
19
  "!git clone $repo_url $mvsepless_dir\n",
20
  "%cd $mvsepless_dir\n",
21
+ "!pip install --no-cache-dir uv\n",
22
  "req = \"\"\"\n",
23
+ "torch\n",
24
+ "torchvision\n",
25
+ "torchaudio\n",
26
  "numpy==2.0.2\n",
27
  "pandas\n",
28
+ "scipy\n",
29
+ "librosa\n",
30
  "samplerate==0.1.0\n",
31
  "matplotlib\n",
32
+ "tqdm\n",
33
+ "einops\n",
34
+ "protobuf\n",
35
+ "soundfile\n",
36
+ "pydub\n",
37
+ "webrtcvad\n",
38
+ "audiomentations\n",
39
  "pedalboard==0.8.2\n",
40
+ "ml_collections\n",
41
+ "timm\n",
42
+ "wandb\n",
43
+ "accelerate\n",
44
+ "bitsandbytes\n",
45
+ "tokenizers\n",
46
+ "huggingface-hub\n",
47
+ "transformers\n",
48
+ "torchseg\n",
 
 
49
  "demucs==4.0.0\n",
50
+ "asteroid\n",
51
+ "prodigyopt\n",
52
+ "torch_log_wmse\n",
53
+ "rotary_embedding_torch\n",
54
  "gradio\n",
55
+ "omegaconf\n",
56
+ "beartype\n",
57
+ "spafe\n",
58
+ "torch_audiomentations\n",
59
+ "auraloss\n",
60
  "onnx>=1.17\n",
61
  "onnx2torch>=0.3.0\n",
62
  "onnxruntime-gpu>=1.17\n",
63
+ "ml_dtypes\n",
64
  "resampy\n",
65
  "yt_dlp\n",
 
66
  "pyngrok\n",
67
  "tabulate\n",
 
68
  "neuraloperator==1.0.2\n",
69
+ "torchcrepe\n",
70
+ "praat-parselmouth\n",
71
  "faiss-cpu==1.11\n",
72
+ "local-attention\n",
73
+ "tenacity\n",
74
  "pyworld\n",
75
  "gdown\n",
76
  "\"\"\"\n",
 
143
  "\n",
144
  "input_url = \"\" # @param {\"type\":\"string\",\"placeholder\":\"Ссылка на аудио/видео\"}\n",
145
  "output_dir = \"/content/downloaded\" # @param {\"type\":\"string\",\"placeholder\":\"Директория для сохранения скачанного аудио\"}\n",
146
+ "cookies_path = \"\" # @param {\"type\":\"string\",\"placeholder\":\"Путь к cookies (для успешного скачивания с ютуба)\"}\n",
147
  "downloaded_file = dw_yt_dlp(url=input_url, output_dir=output_dir, cookie=cookies_path)\n"
148
  ],
149
  "metadata": {
 
325
  "#@markdown ---\n",
326
  "#@markdown ### Входные данные\n",
327
  "#@markdown * Путь к входной папке/файлу:\n",
328
+ "input_path = \"/content/musicboxtntblits_128kbit.mp3\" # @param {\"type\":\"string\",\"placeholder\":\"/путь/к/файлу\"}\n",
329
  "#@markdown ---\n",
330
  "#@markdown ### Выбор модели\n",
331
  "#@markdown * Тип / Имя модели:\n",
 
381
  "id": "H24RtVB1YlE0"
382
  }
383
  },
384
+ {
385
+ "cell_type": "code",
386
+ "execution_count": null,
387
+ "metadata": {
388
+ "cellView": "form",
389
+ "id": "JGme2oZOf_W3"
390
+ },
391
+ "outputs": [],
392
+ "source": [
393
+ "#@title Показать список установленных моделей для преобразования\n",
394
+ "%cd $mvsepless_dir\n",
395
+ "!python mvsepless/model_manager.py vbach list"
396
+ ]
397
+ },
398
  {
399
  "cell_type": "markdown",
400
  "source": [
 
485
  "# @markdown ---\n",
486
  "# @markdown ### Hubert\n",
487
  "# @markdown * Стэк\n",
488
+ "stack = \"transformers\" # @param [\"fairseq\",\"transformers\"]\n",
489
  "# @markdown * Имя модели для fairseq\n",
490
  "fairseq_embedder = \"hubert_base\" # @param [\"hubert_base\",\"contentvec_base\",\"korean_hubert_base\",\"chinese_hubert_base\",\"portuguese_hubert_base\",\"japanese_hubert_base\"]\n",
491
  "# @markdown * Имя модели для transformers\n",
 
493
  "# @markdown ---\n",
494
  "# @markdown ### Настройки преобразования\n",
495
  "# @markdown * Влияние индекса\n",
496
+ "index_rate = 1 # @param {\"type\":\"slider\",\"min\":0,\"max\":1,\"step\":0.01}\n",
497
  "# @markdown * Стерео режим\n",
498
  "stereo_mode = \"mono\" # @param [\"mono\",\"left/right\",\"sim/dif\"]\n",
499
  "# @markdown * Метод определения тона\n",