update new mix svs model (update ace-opencpop dataset)
Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
- exp/{svs_train_visinger2_raw_phn_none_mix/images/discriminator_loss.png → svs_stats_raw_phn_none_mix/train/feats_stats.npz} +2 -2
- exp/{svs_train_visinger2_raw_phn_none_mix/images/discriminator_backward_time.png → svs_stats_raw_phn_none_mix/train/pitch_stats.npz} +2 -2
- exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_fake_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_forward_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_optim_step_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_real_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_train_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_adv_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_backward_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_feat_match_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_forward_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_kl_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_am_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_ddsp_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_optim_step_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_phn_dur_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_pitch_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_score_dur_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_train_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/iter_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/optim0_lr0.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/optim1_lr0.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/train_time.png +0 -3
- exp/{svs_train_visinger2_raw_phn_none_mix → svs_train_visinger2_spk_embed_lang_raw_phn_none_mix}/500epoch.pth +2 -2
- exp/{svs_train_visinger2_raw_phn_none_mix → svs_train_visinger2_spk_embed_lang_raw_phn_none_mix}/config.yaml +7 -8
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_backward_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_fake_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_forward_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_optim_step_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_real_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_train_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_adv_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_backward_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_feat_match_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_forward_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_kl_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_am_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_ddsp_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_optim_step_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_phn_dur_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_pitch_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_score_dur_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_train_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png +0 -0
exp/{svs_train_visinger2_raw_phn_none_mix/images/discriminator_loss.png → svs_stats_raw_phn_none_mix/train/feats_stats.npz}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95cbffa329e7b157b9c3481e7f8442a1867ead3b27518e7649ec486b76a56fab
|
| 3 |
+
size 1402
|
exp/{svs_train_visinger2_raw_phn_none_mix/images/discriminator_backward_time.png → svs_stats_raw_phn_none_mix/train/pitch_stats.npz}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:57b5a91ae0d5d359c421e234aadc10c44f3892fb73392cfb1cdb72810afbca1c
|
| 3 |
+
size 770
|
exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_fake_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_forward_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_optim_step_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_real_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_train_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_adv_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_backward_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_feat_match_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_forward_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_kl_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_am_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_ddsp_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_optim_step_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_phn_dur_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_pitch_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_score_dur_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_train_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/iter_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/optim0_lr0.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/optim1_lr0.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/train_time.png
DELETED
Git LFS Details
|
exp/{svs_train_visinger2_raw_phn_none_mix → svs_train_visinger2_spk_embed_lang_raw_phn_none_mix}/500epoch.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c93a08500a8958e48a57dd6780033635d11916de8e1d72a8691124ef2eb95f2a
|
| 3 |
+
size 448412302
|
exp/{svs_train_visinger2_raw_phn_none_mix → svs_train_visinger2_spk_embed_lang_raw_phn_none_mix}/config.yaml
RENAMED
|
@@ -1,11 +1,11 @@
|
|
| 1 |
-
config: conf/tuning/
|
| 2 |
print_config: false
|
| 3 |
log_level: INFO
|
| 4 |
drop_last_iter: false
|
| 5 |
dry_run: false
|
| 6 |
iterator_type: sequence
|
| 7 |
valid_iterator_type: null
|
| 8 |
-
output_dir: exp/
|
| 9 |
ngpu: 1
|
| 10 |
seed: 777
|
| 11 |
num_workers: 0
|
|
@@ -224,8 +224,8 @@ token_list:
|
|
| 224 |
- an@zh
|
| 225 |
- en@zh
|
| 226 |
- iou@zh
|
| 227 |
-
- t@zh
|
| 228 |
- ou@zh
|
|
|
|
| 229 |
- ao@zh
|
| 230 |
- ong@zh
|
| 231 |
- iang@zh
|
|
@@ -319,16 +319,15 @@ feats_extract_conf:
|
|
| 319 |
fmin: 80
|
| 320 |
fmax: 22050
|
| 321 |
n_mels: 80
|
| 322 |
-
normalize:
|
| 323 |
-
normalize_conf:
|
| 324 |
-
stats_file: exp/svs_stats_raw_phn_none_mix/train/feats_stats.npz
|
| 325 |
svs: vits
|
| 326 |
svs_conf:
|
| 327 |
generator_type: visinger2
|
| 328 |
vocoder_generator_type: visinger2
|
| 329 |
generator_params:
|
| 330 |
hidden_channels: 192
|
| 331 |
-
|
| 332 |
langs: 3
|
| 333 |
global_channels: 256
|
| 334 |
segment_size: 20
|
|
@@ -538,5 +537,5 @@ energy_normalize_conf: {}
|
|
| 538 |
required:
|
| 539 |
- output_dir
|
| 540 |
- token_list
|
| 541 |
-
version: '
|
| 542 |
distributed: false
|
|
|
|
| 1 |
+
config: conf/tuning/train_visinger2_spk_embed_lang.yaml
|
| 2 |
print_config: false
|
| 3 |
log_level: INFO
|
| 4 |
drop_last_iter: false
|
| 5 |
dry_run: false
|
| 6 |
iterator_type: sequence
|
| 7 |
valid_iterator_type: null
|
| 8 |
+
output_dir: exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix
|
| 9 |
ngpu: 1
|
| 10 |
seed: 777
|
| 11 |
num_workers: 0
|
|
|
|
| 224 |
- an@zh
|
| 225 |
- en@zh
|
| 226 |
- iou@zh
|
|
|
|
| 227 |
- ou@zh
|
| 228 |
+
- t@zh
|
| 229 |
- ao@zh
|
| 230 |
- ong@zh
|
| 231 |
- iang@zh
|
|
|
|
| 319 |
fmin: 80
|
| 320 |
fmax: 22050
|
| 321 |
n_mels: 80
|
| 322 |
+
normalize: null
|
| 323 |
+
normalize_conf: {}
|
|
|
|
| 324 |
svs: vits
|
| 325 |
svs_conf:
|
| 326 |
generator_type: visinger2
|
| 327 |
vocoder_generator_type: visinger2
|
| 328 |
generator_params:
|
| 329 |
hidden_channels: 192
|
| 330 |
+
spk_embed_dim: 192
|
| 331 |
langs: 3
|
| 332 |
global_channels: 256
|
| 333 |
segment_size: 20
|
|
|
|
| 537 |
required:
|
| 538 |
- output_dir
|
| 539 |
- token_list
|
| 540 |
+
version: '202503'
|
| 541 |
distributed: false
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_backward_time.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_fake_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_forward_time.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_optim_step_time.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_real_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_train_time.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_adv_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_backward_time.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_feat_match_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_forward_time.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_kl_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_am_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_ddsp_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_optim_step_time.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_phn_dur_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_pitch_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_score_dur_loss.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_train_time.png
ADDED
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png
ADDED
|