diff --git a/so_vits_svc_4/Apple Bloom (singing, PS1)/speaker.json b/so_vits_svc_4/Apple Bloom (singing, PS1)/speaker.json deleted file mode 100644 index 788eb813941a6a0a78a06a8c4e28ad13e122e391..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Apple Bloom (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Applebloom (singing)" -} \ No newline at end of file diff --git a/so_vits_svc_4/Applejack (singing, PS1)/speaker.json b/so_vits_svc_4/Applejack (singing, PS1)/speaker.json deleted file mode 100644 index 0466242f621d74913f216d34206a6bbee39d1ceb..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Applejack (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Applejack (singing)" -} \ No newline at end of file diff --git a/so_vits_svc_4/Babs Seed (alt)/speaker.json b/so_vits_svc_4/Babs Seed (alt)/speaker.json deleted file mode 100644 index 6bcdfbde4fa501701e7673df190032f44ac9b3b8..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Babs Seed (alt)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Babs-Seed" -} diff --git a/so_vits_svc_4/Babs Seed/G_1668.pth b/so_vits_svc_4/Babs Seed/G_1668.pth deleted file mode 100644 index 1cc0ee3c08c7477b4bac4aac774cbf4761e14967..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Babs Seed/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:abd4211820f140813b9457b1443c0ca212c21e3c8a357b7c7446ec9620787f18 -size 548687709 diff --git a/so_vits_svc_4/Babs Seed/README.txt b/so_vits_svc_4/Babs Seed/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Babs Seed/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Babs Seed/config.json b/so_vits_svc_4/Babs Seed/config.json deleted file mode 100644 index f93dacee7c202cdfe6ca4b3db8ec6fec679a8486..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Babs Seed/config.json +++ /dev/null @@ -1,104 +0,0 @@ -{ - "train": { - "log_interval": 100, - "eval_interval": 1000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 7, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050, - "contentvec_final_proj": false - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 768, - "n_speakers": 200, - "type_": "hifi-gan", - "pretrained": { - "D_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_D_320000.pth", - "G_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_G_320000.pth" - } - }, - "spk": { - "Babs-Seed": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Babs Seed/kmeans.pt b/so_vits_svc_4/Babs Seed/kmeans.pt deleted file mode 100644 index c4271d4538da2b5a7199c9767864db7b4a600be4..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Babs Seed/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d8db10039ba64c92555a340f6e2e0c1d8be4bb7365c7aa38996f4b0667915547 -size 9243631 diff --git a/so_vits_svc_4/Big McIntosh/G_1668.pth b/so_vits_svc_4/Big McIntosh/G_1668.pth deleted file mode 100644 index 20468568412014cc64d28b1ac0a8747cb8871be6..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Big McIntosh/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d04c46333bc2218ab095237496fc9a868f46e723b1c964c7f567a9e66818c0ea -size 548687709 diff --git a/so_vits_svc_4/Big McIntosh/README.txt b/so_vits_svc_4/Big McIntosh/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Big McIntosh/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Big McIntosh/config.json b/so_vits_svc_4/Big McIntosh/config.json deleted file mode 100644 index c0137967f6ebd27e8dabfb8d28e73d0812421e32..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Big McIntosh/config.json +++ /dev/null @@ -1,105 +0,0 @@ -{ - "train": { - "log_interval": 100, - "eval_interval": 1000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 16, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050, - "contentvec_final_proj": false - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 768, - "n_speakers": 200, - "type_": "hifi-gan", - "pretrained": { - "D_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_D_320000.pth", - "G_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_G_320000.pth" - } - }, - "spk": { - "Babs-Seed": 0, - "Big-Mac": 1 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Big McIntosh/kmeans.pt b/so_vits_svc_4/Big McIntosh/kmeans.pt deleted file mode 100644 index 7baec2116600b7f228de868dc8e1e7aff11cc98f..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Big McIntosh/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:56d36b19a77ec7fb8b6e008f62f64b1be3947cd34326b3728db10c3688e52636 -size 18488879 diff --git a/so_vits_svc_4/Big McIntosh/speaker.json b/so_vits_svc_4/Big McIntosh/speaker.json deleted file mode 100644 index 81f39a442acd6aa17949490a0d2159d3552d9e01..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Big McIntosh/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Big-Mac" -} diff --git a/so_vits_svc_4/Braeburn/G_1668.pth b/so_vits_svc_4/Braeburn/G_1668.pth deleted file mode 100644 index 04574ee729424cba75c9598572b262d3d5203b8d..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Braeburn/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:36483d802d182638f5994eae084367c67622e6fa957c6ba66491fd3f3f1cb45d -size 548687709 diff --git a/so_vits_svc_4/Braeburn/README.txt b/so_vits_svc_4/Braeburn/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Braeburn/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Braeburn/config.json b/so_vits_svc_4/Braeburn/config.json deleted file mode 100644 index 3d37de1a14cd058dcfacd998cd59416ace2a06e7..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Braeburn/config.json +++ /dev/null @@ -1,104 +0,0 @@ -{ - "train": { - "log_interval": 100, - "eval_interval": 1000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 7, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050, - "contentvec_final_proj": false - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 768, - "n_speakers": 200, - "type_": "hifi-gan", - "pretrained": { - "D_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_D_320000.pth", - "G_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_G_320000.pth" - } - }, - "spk": { - "Braeburn": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Braeburn/kmeans.pt b/so_vits_svc_4/Braeburn/kmeans.pt deleted file mode 100644 index 2a1d19f9108f8f6e9ef3c8f3332e2a4ff14c5d4c..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Braeburn/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e0086d6d60dc45d6c6bf1803269ee2f847ad5e9eb38b855bdde54d633236f877 -size 9239791 diff --git a/so_vits_svc_4/Cadance (singing, PS1)/speaker.json b/so_vits_svc_4/Cadance (singing, PS1)/speaker.json deleted file mode 100644 index e09703e360a4d3191421355b372ca1b46c536f39..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Cadance (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Cadance (singing)" -} diff --git a/so_vits_svc_4/Celestia (singing)/speaker.json b/so_vits_svc_4/Celestia (singing)/speaker.json deleted file mode 100644 index f23661ad88ba803ce58f556397e4f21d75a86393..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Celestia (singing)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Celestia (singing)" -} diff --git a/so_vits_svc_4/Celestia (singing, PS1)/speaker.json b/so_vits_svc_4/Celestia (singing, PS1)/speaker.json deleted file mode 100644 index f23661ad88ba803ce58f556397e4f21d75a86393..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Celestia (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Celestia (singing)" -} diff --git a/so_vits_svc_4/Celestia (singing, alt)/speaker.json b/so_vits_svc_4/Celestia (singing, alt)/speaker.json deleted file mode 100644 index 49298648ffc8f7e0518f8fe40f2fa845249116b4..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Celestia (singing, alt)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Celestia (singing 2)" -} diff --git a/so_vits_svc_4/Daring Do/speaker.json b/so_vits_svc_4/Daring Do/speaker.json deleted file mode 100644 index 28fbfdd3ea8dffbe3028430e1d282cc9b3eee502..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Daring Do/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "ddm_DaringDo" -} \ No newline at end of file diff --git a/so_vits_svc_4/Diamond Tiara/G_6000.pth b/so_vits_svc_4/Diamond Tiara/G_6000.pth deleted file mode 100644 index 796b264a456c78b23718536bd24741e055b5eac6..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Diamond Tiara/G_6000.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a545aaa00101ae937f0e9a9f6bbde4a47db057f53a28a28609753318781a844e -size 542789469 diff --git a/so_vits_svc_4/Diamond Tiara/README.txt b/so_vits_svc_4/Diamond Tiara/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Diamond Tiara/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Diamond Tiara/config.json b/so_vits_svc_4/Diamond Tiara/config.json deleted file mode 100644 index 084e30015a9249edbc3a89e8fb195dfea2c46cac..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Diamond Tiara/config.json +++ /dev/null @@ -1,98 +0,0 @@ -{ - "train": { - "log_interval": 200, - "eval_interval": 1000, - "seed": 1234, - "epochs": 6000, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 7, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050 - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 256, - "n_speakers": 200 - }, - "spk": { - "Diamond-Tiara": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Diamond Tiara/kmeans.pt b/so_vits_svc_4/Diamond Tiara/kmeans.pt deleted file mode 100644 index d018f5a9f1af15eb5a085dd527bf17999067a10a..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Diamond Tiara/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7f8a63da11fb3bd33fca6a51ee9240535cf356d99515e1769ce36d27486f8d82 -size 3083247 diff --git a/so_vits_svc_4/Doctor Whooves/G_1668.pth b/so_vits_svc_4/Doctor Whooves/G_1668.pth deleted file mode 100644 index 367f5e6024ed7a7cdfafa09cc1464cc4aa828234..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Doctor Whooves/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:210052b249f84c72e341f0c03970394ed5d9d807ccb53ec8b7c091e47c4c5f11 -size 180896611 diff --git a/so_vits_svc_4/Doctor Whooves/README.txt b/so_vits_svc_4/Doctor Whooves/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Doctor Whooves/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Doctor Whooves/config.json b/so_vits_svc_4/Doctor Whooves/config.json deleted file mode 100644 index c76cb752b74428ac878b9751cfc6a331fba80ffd..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Doctor Whooves/config.json +++ /dev/null @@ -1,98 +0,0 @@ -{ - "train": { - "log_interval": 200, - "eval_interval": 25000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 16, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050 - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 256, - "n_speakers": 200 - }, - "spk": { - "Doctor_Whooves": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Flam/speaker.json b/so_vits_svc_4/Flam/speaker.json deleted file mode 100644 index ff8d148204d3a8e92485611eedb1c79c8e25a194..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Flam/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Flam" -} \ No newline at end of file diff --git a/so_vits_svc_4/Flim/speaker.json b/so_vits_svc_4/Flim/speaker.json deleted file mode 100644 index 78900bb89eef3488bdd1e3637a816e023b4e936a..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Flim/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Flim" -} \ No newline at end of file diff --git a/so_vits_svc_4/Fluttershy (singing, PS1)/speaker.json b/so_vits_svc_4/Fluttershy (singing, PS1)/speaker.json deleted file mode 100644 index 936cecfdf4778d53482e61982b5ad3d73903a52c..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Fluttershy (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Fluttershy (singing)" -} diff --git a/so_vits_svc_4/Gallus/G_10000.pth b/so_vits_svc_4/Gallus/G_10000.pth deleted file mode 100644 index e274028c67e7cfe190671d625db3160e3768eb47..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Gallus/G_10000.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ecd3b13e2eab233d1e659ecb8d5138f29bb42af40df6c1c99fcfef510acb9e72 -size 542789469 diff --git a/so_vits_svc_4/Gallus/README.txt b/so_vits_svc_4/Gallus/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Gallus/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Gallus/config.json b/so_vits_svc_4/Gallus/config.json deleted file mode 100644 index 5bdc9a3244fcd92d0a75868fdbf1e4790a99c299..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Gallus/config.json +++ /dev/null @@ -1,98 +0,0 @@ -{ - "train": { - "log_interval": 200, - "eval_interval": 25000, - "seed": 1234, - "epochs": 10000, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 16, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050 - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 256, - "n_speakers": 200 - }, - "spk": { - "Gallus": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Lightning Dust/speaker.json b/so_vits_svc_4/Lightning Dust/speaker.json deleted file mode 100644 index 6a34b06164bae4bed726314ac3fac295cf183eb8..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Lightning Dust/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "ddm_LightningDust" -} \ No newline at end of file diff --git a/so_vits_svc_4/Luna (singing, PS1)/speaker.json b/so_vits_svc_4/Luna (singing, PS1)/speaker.json deleted file mode 100644 index 1425975cc94a7f4ddc990a2b0f839ea186dc1c9c..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Luna (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Luna (singing)" -} diff --git a/so_vits_svc_4/Moon Dancer/speaker.json b/so_vits_svc_4/Moon Dancer/speaker.json deleted file mode 100644 index 2449e47649bce682a2258928d1a47dc02323f4bc..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Moon Dancer/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "ddm_Moondancer" -} \ No newline at end of file diff --git a/so_vits_svc_4/Ocellus/G_1668.pth b/so_vits_svc_4/Ocellus/G_1668.pth deleted file mode 100644 index ebf7dd67bd5319fc79884df4e3c5184f7f2c060f..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Ocellus/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bce86b0dd26db1109bed9f4dcd9a0f40b0f9dc8e77fe8ac21f59f77fced352b3 -size 548687709 diff --git a/so_vits_svc_4/Ocellus/Readme.txt b/so_vits_svc_4/Ocellus/Readme.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Ocellus/Readme.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Ocellus/config.json b/so_vits_svc_4/Ocellus/config.json deleted file mode 100644 index 37440b66b706fc7730bb730280943e1fc7fc7a9b..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Ocellus/config.json +++ /dev/null @@ -1,104 +0,0 @@ -{ - "train": { - "log_interval": 100, - "eval_interval": 1000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 7, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050, - "contentvec_final_proj": false - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 768, - "n_speakers": 200, - "type_": "hifi-gan", - "pretrained": { - "D_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_D_320000.pth", - "G_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_G_320000.pth" - } - }, - "spk": { - "Ocellus": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Ocellus/kmeans.pt b/so_vits_svc_4/Ocellus/kmeans.pt deleted file mode 100644 index 38d98452c9959c728fce2795eef6198028973486..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Ocellus/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:34a5c5b2bbdf005849dfc3d505a728b8be25a0e8bac5be5e04d54eb3c6f4ed6b -size 9242991 diff --git a/so_vits_svc_4/Pinkie Pie (angry)/speaker.json b/so_vits_svc_4/Pinkie Pie (angry)/speaker.json deleted file mode 100644 index af97d2a83d9a233eca041e66682d3ee3aca963cb..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (angry)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {angry}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (annoyed)/speaker.json b/so_vits_svc_4/Pinkie Pie (annoyed)/speaker.json deleted file mode 100644 index cbbdb1c0040db6ae604cd2520101efb01258e6d9..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (annoyed)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {annoyed}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (anxious)/speaker.json b/so_vits_svc_4/Pinkie Pie (anxious)/speaker.json deleted file mode 100644 index 88314fddc4fa1277862cd0c2a0bb86cd65634fe6..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (anxious)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {anxious}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (fearful)/speaker.json b/so_vits_svc_4/Pinkie Pie (fearful)/speaker.json deleted file mode 100644 index 16622e493bd114f4f9f12b86caa4c449a41817b4..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (fearful)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {fear}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (happy)/speaker.json b/so_vits_svc_4/Pinkie Pie (happy)/speaker.json deleted file mode 100644 index 1cce4321bd9bdb9f46272a8b7b335e784ff67383..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (happy)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {happy}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (neutral)/speaker.json b/so_vits_svc_4/Pinkie Pie (neutral)/speaker.json deleted file mode 100644 index a4ab0d7ef362ff32bc78fcdda3d7569ea4a8f775..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (neutral)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {neutral}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (nonverbal)/speaker.json b/so_vits_svc_4/Pinkie Pie (nonverbal)/speaker.json deleted file mode 100644 index f071aa378fce8412b6448faa9ea7b0c12d4fb444..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (nonverbal)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {nonverbal}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (sad shouting)/speaker.json b/so_vits_svc_4/Pinkie Pie (sad shouting)/speaker.json deleted file mode 100644 index 2d28ca15a5aebb8fdc8195bca38f4e7ba27f8874..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (sad shouting)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {sad shouting}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (sad)/speaker.json b/so_vits_svc_4/Pinkie Pie (sad)/speaker.json deleted file mode 100644 index fcbbbc3ce22fb105b81219893d23272320a37901..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (sad)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {sad}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (shouting)/speaker.json b/so_vits_svc_4/Pinkie Pie (shouting)/speaker.json deleted file mode 100644 index 328075fc8bf86921f506fe3324d373af6e7df1ed..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (shouting)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {shouting}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (singing, PS1)/speaker.json b/so_vits_svc_4/Pinkie Pie (singing, PS1)/speaker.json deleted file mode 100644 index e4cc51f29a9061c325b1fd9b75a2f30cf3d4f2ab..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie Pie (singing)" -} diff --git a/so_vits_svc_4/Pinkie Pie (surprised)/speaker.json b/so_vits_svc_4/Pinkie Pie (surprised)/speaker.json deleted file mode 100644 index 46799bfb7131b315e6efa78f07084222dba74020..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (surprised)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {surprised}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (tired)/speaker.json b/so_vits_svc_4/Pinkie Pie (tired)/speaker.json deleted file mode 100644 index 22ccaa9836c02daddd0ff7f3e87c0919e4fddea7..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (tired)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {tired}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Pinkie Pie (whispering)/speaker.json b/so_vits_svc_4/Pinkie Pie (whispering)/speaker.json deleted file mode 100644 index deb6eef316ac6f7f0c0fc4042fec33a1bba1a4cd..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Pinkie Pie (whispering)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Pinkie {whispered}" -} \ No newline at end of file diff --git a/so_vits_svc_4/Rainbow Dash (singing, PS1)/speaker.json b/so_vits_svc_4/Rainbow Dash (singing, PS1)/speaker.json deleted file mode 100644 index 76598271ba54d6c354cb3e996656c3f75de8585d..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Rainbow Dash (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Rainbow Dash (singing)" -} diff --git a/so_vits_svc_4/Rarity (singing, PS1)/speaker.json b/so_vits_svc_4/Rarity (singing, PS1)/speaker.json deleted file mode 100644 index 673001b2e53b714e3cb83ef3816ccb69f0210972..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Rarity (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Rarity (singing)" -} diff --git a/so_vits_svc_4/Sandbar/G_1668.pth b/so_vits_svc_4/Sandbar/G_1668.pth deleted file mode 100644 index af1e9274cca7e5ca89acb36799c8a6ac8d4ddfc0..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Sandbar/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:57939b58d011b2db6c90b78e07c6ee48cc6fffdd421bb916e23efd96c322cd8b -size 548687709 diff --git a/so_vits_svc_4/Sandbar/README.txt b/so_vits_svc_4/Sandbar/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Sandbar/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Sandbar/config.json b/so_vits_svc_4/Sandbar/config.json deleted file mode 100644 index e3227055ce587eea4b9f6beb1621a4bd4d56fe53..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Sandbar/config.json +++ /dev/null @@ -1,104 +0,0 @@ -{ - "train": { - "log_interval": 100, - "eval_interval": 1000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 7, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050, - "contentvec_final_proj": false - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 768, - "n_speakers": 200, - "type_": "hifi-gan", - "pretrained": { - "D_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_D_320000.pth", - "G_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_G_320000.pth" - } - }, - "spk": { - "Sandbar": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Sandbar/kmeans.pt b/so_vits_svc_4/Sandbar/kmeans.pt deleted file mode 100644 index 44d998a88eaf83a81482a8706301985315febf2b..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Sandbar/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:87ccf23568137b34382f6253a5ff710317ca6bf03cfc75a341e3938fd3d7d8bf -size 9240175 diff --git a/so_vits_svc_4/Scootaloo (singing, PS1)/speaker.json b/so_vits_svc_4/Scootaloo (singing, PS1)/speaker.json deleted file mode 100644 index 18a405a2026cfbfb63a0ff9fa3da494bb3947505..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Scootaloo (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Scootaloo (singing)" -} diff --git a/so_vits_svc_4/Scootaloo (singing, alt)/speaker.json b/so_vits_svc_4/Scootaloo (singing, alt)/speaker.json deleted file mode 100644 index 18a405a2026cfbfb63a0ff9fa3da494bb3947505..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Scootaloo (singing, alt)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Scootaloo (singing)" -} diff --git a/so_vits_svc_4/Silverstream/G_1668.pth b/so_vits_svc_4/Silverstream/G_1668.pth deleted file mode 100644 index 449064a9c492dbb4b031acfaa4d0157413c485f4..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Silverstream/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3f7d3b316100a46a4e6141f00874bfbe62add061234083a647a83abe868686d6 -size 548687709 diff --git a/so_vits_svc_4/Silverstream/Readme.txt b/so_vits_svc_4/Silverstream/Readme.txt deleted file mode 100644 index 600b0b9ce5a896c62a885c667a2bab2dbc15637e..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Silverstream/Readme.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1pyitdHlO2-XOYC6H4iVK7AS5aRDeSuxG?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Silverstream/config.json b/so_vits_svc_4/Silverstream/config.json deleted file mode 100644 index cc4c82812647d890e9b4cb4da7d2a0ee63de9f64..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Silverstream/config.json +++ /dev/null @@ -1,104 +0,0 @@ -{ - "train": { - "log_interval": 100, - "eval_interval": 25000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 7, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050, - "contentvec_final_proj": false - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 768, - "n_speakers": 200, - "type_": "hifi-gan", - "pretrained": { - "D_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_D_320000.pth", - "G_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_G_320000.pth" - } - }, - "spk": { - "Silverstream": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Silverstream/kmeans.pt b/so_vits_svc_4/Silverstream/kmeans.pt deleted file mode 100644 index 3d7e8ecb56ef69e2689acebe003d778ad93cc321..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Silverstream/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:abccfbd462debc7fd7cc9f245b90c0043009df5831b26564ab495f0403f21a21 -size 9247343 diff --git a/so_vits_svc_4/Smolder/G_1668.pth b/so_vits_svc_4/Smolder/G_1668.pth deleted file mode 100644 index f1ff7673267b7b934c6daa0fcc8b15376544003e..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Smolder/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3a1616ef8cc1b889662c590d99c591e1ba6872f2661494f4d8535146b5754277 -size 548687709 diff --git a/so_vits_svc_4/Smolder/README.txt b/so_vits_svc_4/Smolder/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Smolder/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Smolder/config.json b/so_vits_svc_4/Smolder/config.json deleted file mode 100644 index c6a80268a871d46c5a5b692bacbd0826c4d5f54b..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Smolder/config.json +++ /dev/null @@ -1,104 +0,0 @@ -{ - "train": { - "log_interval": 100, - "eval_interval": 1000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 7, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050, - "contentvec_final_proj": false - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 768, - "n_speakers": 200, - "type_": "hifi-gan", - "pretrained": { - "D_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_D_320000.pth", - "G_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_G_320000.pth" - } - }, - "spk": { - "Smolder": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Smolder/kmeans.pt b/so_vits_svc_4/Smolder/kmeans.pt deleted file mode 100644 index d105967bc07c395f5af869a8c79bab64c81ff7a5..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Smolder/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0ba0c69e3d3194a1890c9a10db1bf60c74d5392797f14d29d93a00ea6b54332b -size 9243183 diff --git a/so_vits_svc_4/Spike/G_1668.pth b/so_vits_svc_4/Spike/G_1668.pth deleted file mode 100644 index 5ff5ecb3d0ba29d42e63e148d13a5ece0dbad94d..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Spike/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:68039e6d50a3f5e2472b6631fe50d0936586db846bb77efc7dc2da071124f044 -size 548687709 diff --git a/so_vits_svc_4/Spike/README.txt b/so_vits_svc_4/Spike/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Spike/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Spike/config.json b/so_vits_svc_4/Spike/config.json deleted file mode 100644 index e3227055ce587eea4b9f6beb1621a4bd4d56fe53..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Spike/config.json +++ /dev/null @@ -1,104 +0,0 @@ -{ - "train": { - "log_interval": 100, - "eval_interval": 1000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 7, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050, - "contentvec_final_proj": false - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 768, - "n_speakers": 200, - "type_": "hifi-gan", - "pretrained": { - "D_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_D_320000.pth", - "G_0.pth": "https://huggingface.co/datasets/ms903/sovits4.0-768vec-layer12/resolve/main/sovits_768l12_pre_large_320k/clean_G_320000.pth" - } - }, - "spk": { - "Sandbar": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Spike/kmeans.pt b/so_vits_svc_4/Spike/kmeans.pt deleted file mode 100644 index 0be67e479a16afb5aa58ee1e8be32b09b2ebf04c..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Spike/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3034e09ce75cd1a29bafe3f4c5e1756b9b10e2d608d2370229d6b7d62019a01a -size 9240111 diff --git a/so_vits_svc_4/Starlight Glimmer (evil)/speaker.json b/so_vits_svc_4/Starlight Glimmer (evil)/speaker.json deleted file mode 100644 index c349101f2536aecd8c725c714f9d53104b93f11e..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Starlight Glimmer (evil)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Starlight Glimmer (evil speaking)" -} \ No newline at end of file diff --git a/so_vits_svc_4/Starlight Glimmer (good)/speaker.json b/so_vits_svc_4/Starlight Glimmer (good)/speaker.json deleted file mode 100644 index e6ae34ddf59a0147da6acd3a74b9e88468852e19..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Starlight Glimmer (good)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Starlight Glimmer (good speaking)" -} \ No newline at end of file diff --git a/so_vits_svc_4/Starlight Glimmer (singing, evil)/speaker.json b/so_vits_svc_4/Starlight Glimmer (singing, evil)/speaker.json deleted file mode 100644 index 73e4450ddff5e0736b0ee3588e8b8b5ccdce3d01..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Starlight Glimmer (singing, evil)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Starlight Glimmer (evil)" -} diff --git a/so_vits_svc_4/Starlight Glimmer (singing, good)/speaker.json b/so_vits_svc_4/Starlight Glimmer (singing, good)/speaker.json deleted file mode 100644 index 6bbdde3f689fe547da16b8fa3303d75d47400351..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Starlight Glimmer (singing, good)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Starlight Glimmer (good)" -} diff --git a/so_vits_svc_4/Sunny Starscout/G_1668.pth b/so_vits_svc_4/Sunny Starscout/G_1668.pth deleted file mode 100644 index 357ebee3c348a10b9422adbaa24dec879d79d1ee..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Sunny Starscout/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b50638d56e729b0eba22290da3c3ac048c2c518f3fa8090c5ebe13ba9f6eaf94 -size 542789469 diff --git a/so_vits_svc_4/Sunny Starscout/README.txt b/so_vits_svc_4/Sunny Starscout/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Sunny Starscout/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Sunny Starscout/config.json b/so_vits_svc_4/Sunny Starscout/config.json deleted file mode 100644 index 1ccd4fe169f705f00146cad245882b788aaad097..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Sunny Starscout/config.json +++ /dev/null @@ -1,98 +0,0 @@ -{ - "train": { - "log_interval": 200, - "eval_interval": 25000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 16, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050 - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 256, - "n_speakers": 200 - }, - "spk": { - "Sunny": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Sunny Starscout/kmeans.pt b/so_vits_svc_4/Sunny Starscout/kmeans.pt deleted file mode 100644 index e0303c84ed388b4693df3ee1c142644c4cb463de..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Sunny Starscout/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:76332c18bc3877cdd26a39c3448155a1aefdda44e907f3bcc96311b2724887b1 -size 3087407 diff --git a/so_vits_svc_4/Sweetie Belle (singing, PS1)/speaker.json b/so_vits_svc_4/Sweetie Belle (singing, PS1)/speaker.json deleted file mode 100644 index 623996fac0810b5c2e50a6a6c68362230d89ccab..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Sweetie Belle (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Sweetie Belle (singing)" -} diff --git a/so_vits_svc_4/Tempest Shadow/G_1668.pth b/so_vits_svc_4/Tempest Shadow/G_1668.pth deleted file mode 100644 index 0e752341a6d2b633b07599caae54fd8f1d8f56fa..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Tempest Shadow/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2b0477968545989643e836e1db4d52a3969658638934becb8fd727edc122a354 -size 542789469 diff --git a/so_vits_svc_4/Tempest Shadow/README.txt b/so_vits_svc_4/Tempest Shadow/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Tempest Shadow/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Tempest Shadow/config.json b/so_vits_svc_4/Tempest Shadow/config.json deleted file mode 100644 index 0f84ea0459a30cba6278aee216db64ef5f7ae251..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Tempest Shadow/config.json +++ /dev/null @@ -1,98 +0,0 @@ -{ - "train": { - "log_interval": 200, - "eval_interval": 25000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 16, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050 - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 256, - "n_speakers": 200 - }, - "spk": { - "TempestShadow": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Tempest Shadow/kmeans.pt b/so_vits_svc_4/Tempest Shadow/kmeans.pt deleted file mode 100644 index df2dd6250064cf35752fb83246166e0b6b35355c..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Tempest Shadow/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a299f03df035f4f63ac7f9078da88e5ccb9718f54ade73b076feb803a2823361 -size 3087599 diff --git a/so_vits_svc_4/Thorax/G_1668.pth b/so_vits_svc_4/Thorax/G_1668.pth deleted file mode 100644 index 93a2c92b5d1b851e1dfe32d6bab92efe21d0c5bc..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Thorax/G_1668.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b85d379a75871ae5373f00dae556ba4cffd88bd350d885c6fd289b09d231b788 -size 542789469 diff --git a/so_vits_svc_4/Thorax/README.txt b/so_vits_svc_4/Thorax/README.txt deleted file mode 100644 index f68638f98fd77a7da412f5f069f2f1a822eb6b57..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Thorax/README.txt +++ /dev/null @@ -1,4 +0,0 @@ -Originally uploaded by ThunderAnon: -https://drive.google.com/drive/folders/1F0_Idv8G3s0R7RWxF_PctdxnAWUeyH_C?usp=sharing -Each zip and rar file in that link contained a large D_.pth file which is not needed for inference, -so I have reuploaded just the necessary files to the reduce the download time for Hay Say. \ No newline at end of file diff --git a/so_vits_svc_4/Thorax/config.json b/so_vits_svc_4/Thorax/config.json deleted file mode 100644 index 1caae05358acfe1d0d944781ba08d4c848a286ef..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Thorax/config.json +++ /dev/null @@ -1,98 +0,0 @@ -{ - "train": { - "log_interval": 200, - "eval_interval": 25000, - "seed": 1234, - "epochs": 1668, - "learning_rate": 0.0001, - "betas": [ - 0.8, - 0.99 - ], - "eps": 1e-09, - "batch_size": 16, - "fp16_run": false, - "bf16_run": false, - "lr_decay": 0.999875, - "segment_size": 10240, - "init_lr_ratio": 1, - "warmup_epochs": 0, - "c_mel": 45, - "c_kl": 1.0, - "use_sr": true, - "max_speclen": 512, - "port": "8001", - "keep_ckpts": 3, - "num_workers": 4, - "log_version": 0, - "ckpt_name_by_step": false, - "accumulate_grad_batches": 1 - }, - "data": { - "training_files": "filelists/44k/train.txt", - "validation_files": "filelists/44k/val.txt", - "max_wav_value": 32768.0, - "sampling_rate": 44100, - "filter_length": 2048, - "hop_length": 512, - "win_length": 2048, - "n_mel_channels": 80, - "mel_fmin": 0.0, - "mel_fmax": 22050 - }, - "model": { - "inter_channels": 192, - "hidden_channels": 192, - "filter_channels": 768, - "n_heads": 2, - "n_layers": 6, - "kernel_size": 3, - "p_dropout": 0.1, - "resblock": "1", - "resblock_kernel_sizes": [ - 3, - 7, - 11 - ], - "resblock_dilation_sizes": [ - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ], - [ - 1, - 3, - 5 - ] - ], - "upsample_rates": [ - 8, - 8, - 2, - 2, - 2 - ], - "upsample_initial_channel": 512, - "upsample_kernel_sizes": [ - 16, - 16, - 4, - 4, - 4 - ], - "n_layers_q": 3, - "use_spectral_norm": false, - "gin_channels": 256, - "ssl_dim": 256, - "n_speakers": 200 - }, - "spk": { - "Thorax": 0 - } -} \ No newline at end of file diff --git a/so_vits_svc_4/Thorax/kmeans.pt b/so_vits_svc_4/Thorax/kmeans.pt deleted file mode 100644 index 410b80b72e17e4bd537eca269d8e8849d5953797..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Thorax/kmeans.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f5311360bf39bf408780b55969e76d0b319449cdeecc9d4043b73591cd90713a -size 3079919 diff --git a/so_vits_svc_4/Trixie Lulamoon (singing)/speaker.json b/so_vits_svc_4/Trixie Lulamoon (singing)/speaker.json deleted file mode 100644 index 907b6d1b9d7f746c7fdbff31f07375bf04b11ef0..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Trixie Lulamoon (singing)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Trixie (singing)" -} diff --git a/so_vits_svc_4/Trixie Lulamoon/speaker.json b/so_vits_svc_4/Trixie Lulamoon/speaker.json deleted file mode 100644 index 551419b248f56218db64adf2747cd6e23e6aba6d..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Trixie Lulamoon/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Trixie (speaking)" -} diff --git a/so_vits_svc_4/Twilight Sparkle (singing, PS1)/speaker.json b/so_vits_svc_4/Twilight Sparkle (singing, PS1)/speaker.json deleted file mode 100644 index 27e2adedffe77fdcf33c23880352f08f8d82f199..0000000000000000000000000000000000000000 --- a/so_vits_svc_4/Twilight Sparkle (singing, PS1)/speaker.json +++ /dev/null @@ -1,3 +0,0 @@ -{ - "speaker": "Twilight Sparkle (singing)" -}