Aslamshahsyed blaise-tk committed on
Commit
142a67c
·
0 Parent(s):

Duplicate from IAHispano/Applio

Browse files

Co-authored-by: Blaise <blaise-tk@users.noreply.huggingface.co>

This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +47 -0
  2. Compiled/.gitignore +0 -0
  3. Compiled/Linux/.gitignore +0 -0
  4. Compiled/Linux/ApplioV3.2.8-bugfix.zip +3 -0
  5. Compiled/Linux/ApplioV3.2.9.zip +3 -0
  6. Compiled/Linux/ApplioV3.3.0.zip +3 -0
  7. Compiled/Windows/.gitignore +0 -0
  8. Compiled/Windows/ApplioV3.2.8-bugfix.zip +3 -0
  9. Compiled/Windows/ApplioV3.2.9.zip +3 -0
  10. Compiled/Windows/ApplioV3.3.0.zip +3 -0
  11. Compiled/Windows/ApplioV3.3.1.zip +3 -0
  12. Compiled/Windows/ApplioV3.4.0.zip +3 -0
  13. Compiled/Windows/ApplioV3.5.0.zip +3 -0
  14. Compiled/Windows/ApplioV3.5.1.zip +3 -0
  15. Compiled/Windows/ApplioV3.6.0.zip +3 -0
  16. Compiled/Windows/ApplioV3.6.1.zip +3 -0
  17. Compiled/Windows/ApplioV3.6.2.zip +3 -0
  18. Enviroment/.gitignore +0 -0
  19. Enviroment/Colab/.gitignore +0 -0
  20. Enviroment/Colab/Pnpur.tar.gz +3 -0
  21. Enviroment/Colab/Pnpur_.tar.gz +3 -0
  22. Enviroment/Colab/tmp_packages.tar.gz +3 -0
  23. Enviroment/Kaggle/.gitignore +0 -0
  24. Enviroment/Kaggle/Kaggle.tar.gz +3 -0
  25. Enviroment/Kaggle/KaggleV2.tar.gz +3 -0
  26. Enviroment/Kaggle/bin_kaggle.tar.gz +3 -0
  27. README.md +100 -0
  28. Resources/contentvec_base.pt +3 -0
  29. Resources/embedders/chinese_hubert_base.pt +3 -0
  30. Resources/embedders/chinese_hubert_base/config.json +71 -0
  31. Resources/embedders/chinese_hubert_base/pytorch_model.bin +3 -0
  32. Resources/embedders/contentvec/config.json +71 -0
  33. Resources/embedders/contentvec/pytorch_model.bin +3 -0
  34. Resources/embedders/contentvec_base.pt +3 -0
  35. Resources/embedders/hubert_base.pt +3 -0
  36. Resources/embedders/japanese_hubert_base.pt +3 -0
  37. Resources/embedders/japanese_hubert_base/config.json +71 -0
  38. Resources/embedders/japanese_hubert_base/pytorch_model.bin +3 -0
  39. Resources/embedders/korean_hubert_base.pt +3 -0
  40. Resources/embedders/korean_hubert_base/config.json +78 -0
  41. Resources/embedders/korean_hubert_base/pytorch_model.bin +3 -0
  42. Resources/embedders/spin-v2/config.json +72 -0
  43. Resources/embedders/spin-v2/pytorch_model.bin +3 -0
  44. Resources/embedders/spin/config.json +71 -0
  45. Resources/embedders/spin/pytorch_model.bin +3 -0
  46. Resources/fcpe.pt +3 -0
  47. Resources/ffmpeg.exe +3 -0
  48. Resources/ffprobe.exe +3 -0
  49. Resources/formant/stftpitchshift +3 -0
  50. Resources/formant/stftpitchshift.exe +0 -0
.gitattributes ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Resources/ffmpeg.exe filter=lfs diff=lfs merge=lfs -text
37
+ Resources/ffprobe.exe filter=lfs diff=lfs merge=lfs -text
38
+ Compiled/ApplioV3.0.9.exe filter=lfs diff=lfs merge=lfs -text
39
+ Compiled/ApplioV3.1.0.exe filter=lfs diff=lfs merge=lfs -text
40
+ Compiled/ApplioV3.1.1.exe filter=lfs diff=lfs merge=lfs -text
41
+ Compiled/ApplioV3.5.0.exe filter=lfs diff=lfs merge=lfs -text
42
+ Compiled/ApplioV3.2.0.exe filter=lfs diff=lfs merge=lfs -text
43
+ Compiled/ApplioV3.2.1.exe filter=lfs diff=lfs merge=lfs -text
44
+ Compiled/ApplioV3.2.2.exe filter=lfs diff=lfs merge=lfs -text
45
+ Compiled/ApplioV3.2.3.exe filter=lfs diff=lfs merge=lfs -text
46
+ Compiled/ApplioV3.2.4.exe filter=lfs diff=lfs merge=lfs -text
47
+ Resources/formant/stftpitchshift filter=lfs diff=lfs merge=lfs -text
Compiled/.gitignore ADDED
File without changes
Compiled/Linux/.gitignore ADDED
File without changes
Compiled/Linux/ApplioV3.2.8-bugfix.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f27ddea9bc182cbac1b2d809f329840ccc6bc1391b8b4918932fbbc396903d21
3
+ size 7544065874
Compiled/Linux/ApplioV3.2.9.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c4785a1c1d6c26ed01061b70e14f6cdba6d00646fffb2aed7b6ef5b10d07d59
3
+ size 7573040499
Compiled/Linux/ApplioV3.3.0.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a10298f10f85e8c49fa8d7490053fde5af3ce76446eb4d812cdfd3db9715c71
3
+ size 9575763753
Compiled/Windows/.gitignore ADDED
File without changes
Compiled/Windows/ApplioV3.2.8-bugfix.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42c68274095cc9d11930dd4a783acea7a9de641753ea1033431fbb07a88ef74b
3
+ size 4220255228
Compiled/Windows/ApplioV3.2.9.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87e6329870f36a31106913a627a1602a1abd84085884d875f83bd53f05b82941
3
+ size 4236244130
Compiled/Windows/ApplioV3.3.0.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:641bddfded4e21b735397572420b34d09d1905c72939a9d629ce981f5fc68ea2
3
+ size 4873873650
Compiled/Windows/ApplioV3.3.1.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af3742262e0ea6724eeca188ad95f9910eccd658321ee2f8f2a88b51df6b4f50
3
+ size 4879206120
Compiled/Windows/ApplioV3.4.0.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:071fb5ec31e12c7afc90aa3a8b1af4842840b44a7b14ccb2fd2b60e9e5268344
3
+ size 4879293026
Compiled/Windows/ApplioV3.5.0.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbe741466989905890d1e046909a6f8d26feaa0244c5defb43e8e116cf4cb6df
3
+ size 4899282098
Compiled/Windows/ApplioV3.5.1.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d8ac88f58aeb265e8a6651085479106410c3602cbe3f64918bc63f64ad768ec
3
+ size 4862979406
Compiled/Windows/ApplioV3.6.0.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dc30842d9dd28d330ad3a07afd052110e67cb8901c820bb0e5181054b5d79a2
3
+ size 5169475119
Compiled/Windows/ApplioV3.6.1.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c4f3a2eb8b0de1be5f1bf0d34f7437855eaf339c68ee7697d408c8e9cba6fc1
3
+ size 5475095742
Compiled/Windows/ApplioV3.6.2.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0763606b8e0b2e2b75077eac5af2772a1682166a812acd9475622fe4c6fb1df9
3
+ size 5440885048
Enviroment/.gitignore ADDED
File without changes
Enviroment/Colab/.gitignore ADDED
File without changes
Enviroment/Colab/Pnpur.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edc00278eee827bf24237492b2a91ccdafdb98393a41ec9b4fff9d9a62b5abe6
3
+ size 2529458747
Enviroment/Colab/Pnpur_.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa42df46fbb0f7e9fad7d493a0ed317754920703be9d148122d766b4aef48ccf
3
+ size 3036863135
Enviroment/Colab/tmp_packages.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df6859c5c7f37bb664926db714bf68a9c2b909f03fa84644cddb1fa3b51a8682
3
+ size 30779249
Enviroment/Kaggle/.gitignore ADDED
File without changes
Enviroment/Kaggle/Kaggle.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:221e9e89d15775a71f2458b30dee22c409f01e0ca9a9463fea43234c7dabc784
3
+ size 2909878809
Enviroment/Kaggle/KaggleV2.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1c19a66ca46bf47f56dd6e46633069b51997d7acd295e36c2e82dd87adc45d8
3
+ size 3249845631
Enviroment/Kaggle/bin_kaggle.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73e273205da615c7ebda701125fbfe08a701fa26d0658e958001c51c69197644
3
+ size 10203128
README.md ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ pipeline_tag: audio-to-audio
3
+ tags:
4
+ - AI
5
+ - RVC
6
+ - VITS
7
+ - VC
8
+ - Voice Conversion
9
+ - Voice2Voice
10
+ license: mit
11
+ datasets:
12
+ - CSTR-Edinburgh/vctk
13
+ base_model:
14
+ - lj1995/VoiceConversionWebUI
15
+ ---
16
+
17
+ <h1 align="center">
18
+ <a href="https://applio.org" target="_blank"><img src="https://github.com/IAHispano/Applio/assets/133521603/78e975d8-b07f-47ba-ab23-5a31592f322a" alt="Applio"></a>
19
+ </h1>
20
+
21
+ <p align="center">A simple, high-quality voice conversion tool, focused on ease of use and performance.</p>
22
+
23
+ <p align="center">
24
+ <a href="https://applio.org" target="_blank">🌐 Website</a>
25
+
26
+ <a href="https://docs.applio.org" target="_blank">📚 Documentation</a>
27
+
28
+ <a href="https://discord.gg/urxFjYmYYh" target="_blank">☎️ Discord</a>
29
+ </p>
30
+
31
+ <p align="center">
32
+ <a href="https://github.com/IAHispano/Applio-Plugins" target="_blank">🛒 Plugins</a>
33
+
34
+ <a href="https://huggingface.co/IAHispano/Applio/tree/main/Compiled" target="_blank">📦 Compiled</a>
35
+
36
+ <a href="https://applio.org/playground" target="_blank">🎮 Playground</a>
37
+
38
+ <a href="https://colab.research.google.com/github/iahispano/applio/blob/master/assets/Applio.ipynb" target="_blank">🔎 Google Colab (UI)</a>
39
+
40
+ <a href="https://colab.research.google.com/github/iahispano/applio/blob/master/assets/Applio_NoUI.ipynb" target="_blank">🔎 Google Colab (No UI)</a>
41
+ </p>
42
+
43
+ ## Introduction
44
+
45
+ Applio is a powerful voice conversion tool focused on simplicity, quality, and performance. Whether you're an artist, developer, or researcher, Applio offers a straightforward platform for high-quality voice transformations. Its flexible design allows for customization through plugins and configurations, catering to a wide range of projects.
46
+
47
+ ## Terms of Use
48
+ The use of Applio is entirely at your own discretion and responsibility. By using this tool, you agree to:
49
+
50
+ 1. Respect all applicable copyrights, intellectual property rights, and privacy rights. Ensure that any audio or material processed through Applio is either owned by you or used with explicit permission from the rightful owner.
51
+
52
+ 2. Avoid using Applio in ways that may harm, defame, or infringe upon the rights of others. This includes, but is not limited to, the creation or distribution of unauthorized content.
53
+
54
+ 3. Comply with all relevant laws and regulations governing the use of AI and voice transformation tools in your jurisdiction.
55
+
56
+ Applio and its contributors are not liable for any misuse of the tool. The responsibility for adhering to ethical practices and legal compliance lies solely with the user. Applio does not endorse or support any activities that result in harm to individuals, groups, or entities. All official models distributed by Applio have been trained on publicly available datasets such as VCTK.
57
+
58
+ ## Getting Started
59
+
60
+ ### 1. Installation
61
+
62
+ Run the installation script based on your operating system:
63
+
64
+ - **Windows:** Double-click `run-install.bat`.
65
+ - **Linux/macOS:** Execute `run-install.sh`.
66
+
67
+ ### 2. Running Applio
68
+
69
+ Start Applio using:
70
+
71
+ - **Windows:** Double-click `run-applio.bat`.
72
+ - **Linux/macOS:** Run `run-applio.sh`.
73
+
74
+ This launches the Gradio interface in your default browser.
75
+
76
+ ### 3. Optional: TensorBoard Monitoring
77
+
78
+ To monitor training or visualize data:
79
+
80
+ - **Windows:** Run `run-tensorboard.bat`.
81
+ - **Linux/macOS:** Run `run-tensorboard.sh`.
82
+
83
+ For more detailed instructions, visit the [documentation](https://docs.applio.org).
84
+
85
+ ## Commercial Usage
86
+
87
+ For commercial use, follow the [MIT license](./LICENSE) and contact us at support@applio.org to ensure ethical use. The use of Applio-generated audio files must comply with applicable copyright law. Consider supporting Applio’s development [through a donation](https://ko-fi.com/iahispano).
88
+
89
+ ## References
90
+
91
+ Applio is made possible thanks to these projects and their references:
92
+
93
+ - [gradio-screen-recorder](https://huggingface.co/spaces/gstaff/gradio-screen-recorder) by gstaff
94
+ - [rvc-cli](https://github.com/blaisewf/rvc-cli) by blaisewf
95
+
96
+ ### Contributors
97
+
98
+ <a href="https://github.com/IAHispano/Applio/graphs/contributors" target="_blank">
99
+ <img src="https://contrib.rocks/image?repo=IAHispano/Applio" />
100
+ </a>
Resources/contentvec_base.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f54b40fd2802423a5643779c4861af1e9ee9c1564dc9d32f54f20b5ffba7db96
3
+ size 189507909
Resources/embedders/chinese_hubert_base.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cd5db6302ae2e79b5972cd02ae375a42a76170374d6e1952fa78d1fe4e4f756
3
+ size 1136482241
Resources/embedders/chinese_hubert_base/config.json ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.1,
3
+ "apply_spec_augment": true,
4
+ "architectures": [
5
+ "HubertModel"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "bos_token_id": 1,
9
+ "classifier_proj_size": 256,
10
+ "conv_bias": false,
11
+ "conv_dim": [
12
+ 512,
13
+ 512,
14
+ 512,
15
+ 512,
16
+ 512,
17
+ 512,
18
+ 512
19
+ ],
20
+ "conv_kernel": [
21
+ 10,
22
+ 3,
23
+ 3,
24
+ 3,
25
+ 3,
26
+ 2,
27
+ 2
28
+ ],
29
+ "conv_stride": [
30
+ 5,
31
+ 2,
32
+ 2,
33
+ 2,
34
+ 2,
35
+ 2,
36
+ 2
37
+ ],
38
+ "ctc_loss_reduction": "sum",
39
+ "ctc_zero_infinity": false,
40
+ "do_stable_layer_norm": false,
41
+ "eos_token_id": 2,
42
+ "feat_extract_activation": "gelu",
43
+ "feat_extract_norm": "group",
44
+ "feat_proj_dropout": 0.0,
45
+ "feat_proj_layer_norm": true,
46
+ "final_dropout": 0.1,
47
+ "hidden_act": "gelu",
48
+ "hidden_dropout": 0.1,
49
+ "hidden_size": 768,
50
+ "initializer_range": 0.02,
51
+ "intermediate_size": 3072,
52
+ "layer_norm_eps": 1e-05,
53
+ "layerdrop": 0.1,
54
+ "mask_feature_length": 10,
55
+ "mask_feature_min_masks": 0,
56
+ "mask_feature_prob": 0.0,
57
+ "mask_time_length": 10,
58
+ "mask_time_min_masks": 2,
59
+ "mask_time_prob": 0.05,
60
+ "model_type": "hubert",
61
+ "num_attention_heads": 12,
62
+ "num_conv_pos_embedding_groups": 16,
63
+ "num_conv_pos_embeddings": 128,
64
+ "num_feat_extract_layers": 7,
65
+ "num_hidden_layers": 12,
66
+ "pad_token_id": 0,
67
+ "torch_dtype": "float32",
68
+ "transformers_version": "4.20.0.dev0",
69
+ "use_weighted_layer_sum": false,
70
+ "vocab_size": 32
71
+ }
Resources/embedders/chinese_hubert_base/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fefccd26c2794a583b80f6f7210c721873cb7ebae2c1cde3baf9b27855e24d8
3
+ size 377552987
Resources/embedders/contentvec/config.json ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.1,
3
+ "apply_spec_augment": true,
4
+ "architectures": [
5
+ "HubertModelWithFinalProj"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "bos_token_id": 1,
9
+ "classifier_proj_size": 256,
10
+ "conv_bias": false,
11
+ "conv_dim": [
12
+ 512,
13
+ 512,
14
+ 512,
15
+ 512,
16
+ 512,
17
+ 512,
18
+ 512
19
+ ],
20
+ "conv_kernel": [
21
+ 10,
22
+ 3,
23
+ 3,
24
+ 3,
25
+ 3,
26
+ 2,
27
+ 2
28
+ ],
29
+ "conv_stride": [
30
+ 5,
31
+ 2,
32
+ 2,
33
+ 2,
34
+ 2,
35
+ 2,
36
+ 2
37
+ ],
38
+ "ctc_loss_reduction": "sum",
39
+ "ctc_zero_infinity": false,
40
+ "do_stable_layer_norm": false,
41
+ "eos_token_id": 2,
42
+ "feat_extract_activation": "gelu",
43
+ "feat_extract_norm": "group",
44
+ "feat_proj_dropout": 0.0,
45
+ "feat_proj_layer_norm": true,
46
+ "final_dropout": 0.1,
47
+ "hidden_act": "gelu",
48
+ "hidden_dropout": 0.1,
49
+ "hidden_size": 768,
50
+ "initializer_range": 0.02,
51
+ "intermediate_size": 3072,
52
+ "layer_norm_eps": 1e-05,
53
+ "layerdrop": 0.1,
54
+ "mask_feature_length": 10,
55
+ "mask_feature_min_masks": 0,
56
+ "mask_feature_prob": 0.0,
57
+ "mask_time_length": 10,
58
+ "mask_time_min_masks": 2,
59
+ "mask_time_prob": 0.05,
60
+ "model_type": "hubert",
61
+ "num_attention_heads": 12,
62
+ "num_conv_pos_embedding_groups": 16,
63
+ "num_conv_pos_embeddings": 128,
64
+ "num_feat_extract_layers": 7,
65
+ "num_hidden_layers": 12,
66
+ "pad_token_id": 0,
67
+ "torch_dtype": "float32",
68
+ "transformers_version": "4.27.3",
69
+ "use_weighted_layer_sum": false,
70
+ "vocab_size": 32
71
+ }
Resources/embedders/contentvec/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8dd400e054ddf4e6be75dab5a2549db748cc99e756a097c496c099f65a4854e
3
+ size 378342945
Resources/embedders/contentvec_base.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f54b40fd2802423a5643779c4861af1e9ee9c1564dc9d32f54f20b5ffba7db96
3
+ size 189507909
Resources/embedders/hubert_base.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f54b40fd2802423a5643779c4861af1e9ee9c1564dc9d32f54f20b5ffba7db96
3
+ size 189507909
Resources/embedders/japanese_hubert_base.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dade3cf824ae0d214f7de8b73e70bae7c101e81f12d93577c4760bf516db4063
3
+ size 378888853
Resources/embedders/japanese_hubert_base/config.json ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.1,
3
+ "apply_spec_augment": true,
4
+ "architectures": [
5
+ "HubertModel"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "bos_token_id": 1,
9
+ "classifier_proj_size": 256,
10
+ "conv_bias": false,
11
+ "conv_dim": [
12
+ 512,
13
+ 512,
14
+ 512,
15
+ 512,
16
+ 512,
17
+ 512,
18
+ 512
19
+ ],
20
+ "conv_kernel": [
21
+ 10,
22
+ 3,
23
+ 3,
24
+ 3,
25
+ 3,
26
+ 2,
27
+ 2
28
+ ],
29
+ "conv_stride": [
30
+ 5,
31
+ 2,
32
+ 2,
33
+ 2,
34
+ 2,
35
+ 2,
36
+ 2
37
+ ],
38
+ "ctc_loss_reduction": "sum",
39
+ "ctc_zero_infinity": false,
40
+ "do_stable_layer_norm": false,
41
+ "eos_token_id": 2,
42
+ "feat_extract_activation": "gelu",
43
+ "feat_extract_norm": "group",
44
+ "feat_proj_dropout": 0.0,
45
+ "feat_proj_layer_norm": true,
46
+ "final_dropout": 0.1,
47
+ "hidden_act": "gelu",
48
+ "hidden_dropout": 0.1,
49
+ "hidden_size": 768,
50
+ "initializer_range": 0.02,
51
+ "intermediate_size": 3072,
52
+ "layer_norm_eps": 1e-05,
53
+ "layerdrop": 0.1,
54
+ "mask_feature_length": 10,
55
+ "mask_feature_min_masks": 0,
56
+ "mask_feature_prob": 0.0,
57
+ "mask_time_length": 10,
58
+ "mask_time_min_masks": 2,
59
+ "mask_time_prob": 0.05,
60
+ "model_type": "hubert",
61
+ "num_attention_heads": 12,
62
+ "num_conv_pos_embedding_groups": 16,
63
+ "num_conv_pos_embeddings": 128,
64
+ "num_feat_extract_layers": 7,
65
+ "num_hidden_layers": 12,
66
+ "pad_token_id": 0,
67
+ "torch_dtype": "float32",
68
+ "transformers_version": "4.28.1",
69
+ "use_weighted_layer_sum": false,
70
+ "vocab_size": 32
71
+ }
Resources/embedders/japanese_hubert_base/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c023ccb71e4c2b5a324c94fc5ebe12403d3081c5f370df229892419996fd113
3
+ size 377554841
Resources/embedders/korean_hubert_base.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b42c8453b96b203198c1c280a8821158ea3fa8dbbc2a6220cad1c1489c3e65e
3
+ size 378876997
Resources/embedders/korean_hubert_base/config.json ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.1,
3
+ "apply_spec_augment": true,
4
+ "architectures": [
5
+ "HubertModel"
6
+ ],
7
+ "auto_map": {
8
+ "FlaxAutoModel": "modeling_flax_hubert.FlaxHubertModel"
9
+ },
10
+ "attention_dropout": 0.1,
11
+ "bos_token_id": 1,
12
+ "conv_bias": false,
13
+ "conv_dim": [
14
+ 512,
15
+ 512,
16
+ 512,
17
+ 512,
18
+ 512,
19
+ 512,
20
+ 512
21
+ ],
22
+ "conv_kernel": [
23
+ 10,
24
+ 3,
25
+ 3,
26
+ 3,
27
+ 3,
28
+ 2,
29
+ 2
30
+ ],
31
+ "conv_stride": [
32
+ 5,
33
+ 2,
34
+ 2,
35
+ 2,
36
+ 2,
37
+ 2,
38
+ 2
39
+ ],
40
+ "ctc_loss_reduction": "sum",
41
+ "ctc_zero_infinity": false,
42
+ "do_stable_layer_norm": false,
43
+ "eos_token_id": 2,
44
+ "feat_extract_activation": "gelu",
45
+ "feat_extract_dropout": 0.0,
46
+ "feat_extract_norm": "group",
47
+ "feat_proj_dropout": 0.1,
48
+ "feat_proj_layer_norm": true,
49
+ "final_dropout": 0.1,
50
+ "final_proj_size": 256,
51
+ "gradient_checkpointing": false,
52
+ "hidden_act": "gelu",
53
+ "hidden_dropout": 0.1,
54
+ "hidden_dropout_prob": 0.1,
55
+ "hidden_size": 768,
56
+ "initializer_range": 0.02,
57
+ "intermediate_size": 3072,
58
+ "layer_norm_eps": 1e-05,
59
+ "layerdrop": 0.1,
60
+ "mask_feature_length": 10,
61
+ "mask_feature_min_masks": 0,
62
+ "mask_feature_prob": 0.0,
63
+ "mask_time_length": 10,
64
+ "mask_time_min_masks": 2,
65
+ "mask_time_prob": 0.05,
66
+ "model_type": "hubert",
67
+ "num_attention_heads": 12,
68
+ "num_conv_pos_embedding_groups": 16,
69
+ "num_conv_pos_embeddings": 128,
70
+ "num_feat_extract_layers": 7,
71
+ "num_hidden_layers": 12,
72
+ "pad_token_id": 0,
73
+ "tokenizer_class": "Wav2Vec2CTCTokenizer",
74
+ "torch_dtype": "float32",
75
+ "transformers_version": "4.30.0.dev0",
76
+ "use_weighted_layer_sum": false,
77
+ "vocab_size": 32
78
+ }
Resources/embedders/korean_hubert_base/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:931f6232879f8eadf7dbd9e00e1fa4cac61ad269af89d509b2ed75009b1a02c5
3
+ size 377554841
Resources/embedders/spin-v2/config.json ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.1,
3
+ "apply_spec_augment": true,
4
+ "architectures": [
5
+ "HubertModelWithFinalProj"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "bos_token_id": 1,
9
+ "classifier_proj_size": 256,
10
+ "conv_bias": false,
11
+ "conv_dim": [
12
+ 512,
13
+ 512,
14
+ 512,
15
+ 512,
16
+ 512,
17
+ 512,
18
+ 512
19
+ ],
20
+ "conv_kernel": [
21
+ 10,
22
+ 3,
23
+ 3,
24
+ 3,
25
+ 3,
26
+ 2,
27
+ 2
28
+ ],
29
+ "conv_pos_batch_norm": false,
30
+ "conv_stride": [
31
+ 5,
32
+ 2,
33
+ 2,
34
+ 2,
35
+ 2,
36
+ 2,
37
+ 2
38
+ ],
39
+ "ctc_loss_reduction": "sum",
40
+ "ctc_zero_infinity": false,
41
+ "do_stable_layer_norm": false,
42
+ "eos_token_id": 2,
43
+ "feat_extract_activation": "gelu",
44
+ "feat_extract_norm": "group",
45
+ "feat_proj_dropout": 0.0,
46
+ "feat_proj_layer_norm": true,
47
+ "final_dropout": 0.1,
48
+ "hidden_act": "gelu",
49
+ "hidden_dropout": 0.1,
50
+ "hidden_size": 768,
51
+ "initializer_range": 0.02,
52
+ "intermediate_size": 3072,
53
+ "layer_norm_eps": 1e-05,
54
+ "layerdrop": 0.1,
55
+ "mask_feature_length": 10,
56
+ "mask_feature_min_masks": 0,
57
+ "mask_feature_prob": 0.0,
58
+ "mask_time_length": 10,
59
+ "mask_time_min_masks": 2,
60
+ "mask_time_prob": 0.05,
61
+ "model_type": "hubert",
62
+ "num_attention_heads": 12,
63
+ "num_conv_pos_embedding_groups": 16,
64
+ "num_conv_pos_embeddings": 128,
65
+ "num_feat_extract_layers": 7,
66
+ "num_hidden_layers": 12,
67
+ "pad_token_id": 0,
68
+ "torch_dtype": "float32",
69
+ "transformers_version": "4.55.0",
70
+ "use_weighted_layer_sum": false,
71
+ "vocab_size": 32
72
+ }
Resources/embedders/spin-v2/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a9ac0be326057b17607a988be497793817f8274e987cf691a1b61192510f823
3
+ size 378356791
Resources/embedders/spin/config.json ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.1,
3
+ "apply_spec_augment": true,
4
+ "architectures": [
5
+ "HubertModelWithFinalProj"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "bos_token_id": 1,
9
+ "classifier_proj_size": 256,
10
+ "conv_bias": false,
11
+ "conv_dim": [
12
+ 512,
13
+ 512,
14
+ 512,
15
+ 512,
16
+ 512,
17
+ 512,
18
+ 512
19
+ ],
20
+ "conv_kernel": [
21
+ 10,
22
+ 3,
23
+ 3,
24
+ 3,
25
+ 3,
26
+ 2,
27
+ 2
28
+ ],
29
+ "conv_stride": [
30
+ 5,
31
+ 2,
32
+ 2,
33
+ 2,
34
+ 2,
35
+ 2,
36
+ 2
37
+ ],
38
+ "ctc_loss_reduction": "sum",
39
+ "ctc_zero_infinity": false,
40
+ "do_stable_layer_norm": false,
41
+ "eos_token_id": 2,
42
+ "feat_extract_activation": "gelu",
43
+ "feat_extract_norm": "group",
44
+ "feat_proj_dropout": 0.0,
45
+ "feat_proj_layer_norm": true,
46
+ "final_dropout": 0.1,
47
+ "hidden_act": "gelu",
48
+ "hidden_dropout": 0.1,
49
+ "hidden_size": 768,
50
+ "initializer_range": 0.02,
51
+ "intermediate_size": 3072,
52
+ "layer_norm_eps": 1e-05,
53
+ "layerdrop": 0.1,
54
+ "mask_feature_length": 10,
55
+ "mask_feature_min_masks": 0,
56
+ "mask_feature_prob": 0.0,
57
+ "mask_time_length": 10,
58
+ "mask_time_min_masks": 2,
59
+ "mask_time_prob": 0.05,
60
+ "model_type": "hubert",
61
+ "num_attention_heads": 12,
62
+ "num_conv_pos_embedding_groups": 16,
63
+ "num_conv_pos_embeddings": 128,
64
+ "num_feat_extract_layers": 7,
65
+ "num_hidden_layers": 12,
66
+ "pad_token_id": 0,
67
+ "torch_dtype": "float32",
68
+ "transformers_version": "4.44.2",
69
+ "use_weighted_layer_sum": false,
70
+ "vocab_size": 32
71
+ }
Resources/embedders/spin/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:057f12bfda54e2d486d86a52a3beb2a07c96a888bc6ac0c382c12ac18dbd500c
3
+ size 378356791
Resources/fcpe.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8544427eebbf2baef6213cc9a05057e46961617a8e5bd96975a0d42da6a09059
3
+ size 43362881
Resources/ffmpeg.exe ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6a4d917a444790f4c06ada640c1c0c95aecde2f8953ed8d0dfb19352500bfcd
3
+ size 52925440
Resources/ffprobe.exe ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2da5b980a9a14a808f423d181c4ed51c2b8af11b1366699f3f7eab0609926f8f
3
+ size 122135040
Resources/formant/stftpitchshift ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb2f50ea8e5ca1a11a587f11f25ba9182f9b24e2367ac480f430b3f04062782e
3
+ size 1822104
Resources/formant/stftpitchshift.exe ADDED
Binary file (276 kB). View file