update new mix svs model (update ace-opencpop dataset)
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- exp/{svs_train_visinger2_raw_phn_none_mix/images/discriminator_loss.png → svs_stats_raw_phn_none_mix/train/feats_stats.npz} +2 -2
- exp/{svs_train_visinger2_raw_phn_none_mix/images/discriminator_backward_time.png → svs_stats_raw_phn_none_mix/train/pitch_stats.npz} +2 -2
- exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_fake_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_forward_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_optim_step_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_real_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_train_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_adv_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_backward_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_feat_match_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_forward_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_kl_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_am_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_ddsp_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_optim_step_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_phn_dur_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_pitch_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_score_dur_loss.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/generator_train_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/iter_time.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/optim0_lr0.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/optim1_lr0.png +0 -3
- exp/svs_train_visinger2_raw_phn_none_mix/images/train_time.png +0 -3
- exp/{svs_train_visinger2_raw_phn_none_mix → svs_train_visinger2_spk_embed_lang_raw_phn_none_mix}/500epoch.pth +2 -2
- exp/{svs_train_visinger2_raw_phn_none_mix → svs_train_visinger2_spk_embed_lang_raw_phn_none_mix}/config.yaml +7 -8
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_backward_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_fake_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_forward_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_optim_step_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_real_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_train_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_adv_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_backward_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_feat_match_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_forward_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_kl_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_am_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_ddsp_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_optim_step_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_phn_dur_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_pitch_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_score_dur_loss.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_train_time.png +0 -0
- exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png +0 -0
exp/{svs_train_visinger2_raw_phn_none_mix/images/discriminator_loss.png → svs_stats_raw_phn_none_mix/train/feats_stats.npz}
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95cbffa329e7b157b9c3481e7f8442a1867ead3b27518e7649ec486b76a56fab
|
3 |
+
size 1402
|
exp/{svs_train_visinger2_raw_phn_none_mix/images/discriminator_backward_time.png → svs_stats_raw_phn_none_mix/train/pitch_stats.npz}
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57b5a91ae0d5d359c421e234aadc10c44f3892fb73392cfb1cdb72810afbca1c
|
3 |
+
size 770
|
exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_fake_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_forward_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_optim_step_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_real_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_train_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_adv_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_backward_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_feat_match_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_forward_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_kl_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_am_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_ddsp_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_optim_step_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_phn_dur_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_pitch_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_score_dur_loss.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/generator_train_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/iter_time.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/optim0_lr0.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/optim1_lr0.png
DELETED
Git LFS Details
|
exp/svs_train_visinger2_raw_phn_none_mix/images/train_time.png
DELETED
Git LFS Details
|
exp/{svs_train_visinger2_raw_phn_none_mix → svs_train_visinger2_spk_embed_lang_raw_phn_none_mix}/500epoch.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c93a08500a8958e48a57dd6780033635d11916de8e1d72a8691124ef2eb95f2a
|
3 |
+
size 448412302
|
exp/{svs_train_visinger2_raw_phn_none_mix → svs_train_visinger2_spk_embed_lang_raw_phn_none_mix}/config.yaml
RENAMED
@@ -1,11 +1,11 @@
|
|
1 |
-
config: conf/tuning/
|
2 |
print_config: false
|
3 |
log_level: INFO
|
4 |
drop_last_iter: false
|
5 |
dry_run: false
|
6 |
iterator_type: sequence
|
7 |
valid_iterator_type: null
|
8 |
-
output_dir: exp/
|
9 |
ngpu: 1
|
10 |
seed: 777
|
11 |
num_workers: 0
|
@@ -224,8 +224,8 @@ token_list:
|
|
224 |
- an@zh
|
225 |
- en@zh
|
226 |
- iou@zh
|
227 |
-
- t@zh
|
228 |
- ou@zh
|
|
|
229 |
- ao@zh
|
230 |
- ong@zh
|
231 |
- iang@zh
|
@@ -319,16 +319,15 @@ feats_extract_conf:
|
|
319 |
fmin: 80
|
320 |
fmax: 22050
|
321 |
n_mels: 80
|
322 |
-
normalize:
|
323 |
-
normalize_conf:
|
324 |
-
stats_file: exp/svs_stats_raw_phn_none_mix/train/feats_stats.npz
|
325 |
svs: vits
|
326 |
svs_conf:
|
327 |
generator_type: visinger2
|
328 |
vocoder_generator_type: visinger2
|
329 |
generator_params:
|
330 |
hidden_channels: 192
|
331 |
-
|
332 |
langs: 3
|
333 |
global_channels: 256
|
334 |
segment_size: 20
|
@@ -538,5 +537,5 @@ energy_normalize_conf: {}
|
|
538 |
required:
|
539 |
- output_dir
|
540 |
- token_list
|
541 |
-
version: '
|
542 |
distributed: false
|
|
|
1 |
+
config: conf/tuning/train_visinger2_spk_embed_lang.yaml
|
2 |
print_config: false
|
3 |
log_level: INFO
|
4 |
drop_last_iter: false
|
5 |
dry_run: false
|
6 |
iterator_type: sequence
|
7 |
valid_iterator_type: null
|
8 |
+
output_dir: exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix
|
9 |
ngpu: 1
|
10 |
seed: 777
|
11 |
num_workers: 0
|
|
|
224 |
- an@zh
|
225 |
- en@zh
|
226 |
- iou@zh
|
|
|
227 |
- ou@zh
|
228 |
+
- t@zh
|
229 |
- ao@zh
|
230 |
- ong@zh
|
231 |
- iang@zh
|
|
|
319 |
fmin: 80
|
320 |
fmax: 22050
|
321 |
n_mels: 80
|
322 |
+
normalize: null
|
323 |
+
normalize_conf: {}
|
|
|
324 |
svs: vits
|
325 |
svs_conf:
|
326 |
generator_type: visinger2
|
327 |
vocoder_generator_type: visinger2
|
328 |
generator_params:
|
329 |
hidden_channels: 192
|
330 |
+
spk_embed_dim: 192
|
331 |
langs: 3
|
332 |
global_channels: 256
|
333 |
segment_size: 20
|
|
|
537 |
required:
|
538 |
- output_dir
|
539 |
- token_list
|
540 |
+
version: '202503'
|
541 |
distributed: false
|
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_backward_time.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_fake_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_forward_time.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_optim_step_time.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_real_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_train_time.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_adv_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_backward_time.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_feat_match_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_forward_time.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_kl_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_am_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_ddsp_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_optim_step_time.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_phn_dur_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_pitch_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_score_dur_loss.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_train_time.png
ADDED
![]() |
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png
ADDED
![]() |