TangRain committed on
Commit
347a041
·
1 Parent(s): 68452cd

update model (fix ace-opencpop)

Browse files
Files changed (30) hide show
  1. exp/svs_stats_raw_phn_none_mix/train/feats_stats.npz +3 -0
  2. exp/svs_stats_raw_phn_none_mix/train/pitch_stats.npz +3 -0
  3. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/500epoch.pth +3 -0
  4. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/config.yaml +541 -0
  5. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_backward_time.png +0 -0
  6. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_fake_loss.png +0 -0
  7. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_forward_time.png +0 -0
  8. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_loss.png +0 -0
  9. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_optim_step_time.png +0 -0
  10. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_real_loss.png +0 -0
  11. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_train_time.png +0 -0
  12. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_adv_loss.png +0 -0
  13. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_backward_time.png +0 -0
  14. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_feat_match_loss.png +0 -0
  15. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_forward_time.png +0 -0
  16. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_kl_loss.png +0 -0
  17. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_loss.png +0 -0
  18. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_am_loss.png +0 -0
  19. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_ddsp_loss.png +0 -0
  20. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_loss.png +0 -0
  21. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_optim_step_time.png +0 -0
  22. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_phn_dur_loss.png +0 -0
  23. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_pitch_loss.png +0 -0
  24. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_score_dur_loss.png +0 -0
  25. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_train_time.png +0 -0
  26. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png +0 -0
  27. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/iter_time.png +0 -0
  28. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/optim0_lr0.png +0 -0
  29. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/optim1_lr0.png +0 -0
  30. exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/train_time.png +0 -0
exp/svs_stats_raw_phn_none_mix/train/feats_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95cbffa329e7b157b9c3481e7f8442a1867ead3b27518e7649ec486b76a56fab
3
+ size 1402
exp/svs_stats_raw_phn_none_mix/train/pitch_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57b5a91ae0d5d359c421e234aadc10c44f3892fb73392cfb1cdb72810afbca1c
3
+ size 770
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/500epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c93a08500a8958e48a57dd6780033635d11916de8e1d72a8691124ef2eb95f2a
3
+ size 448412302
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/config.yaml ADDED
@@ -0,0 +1,541 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_visinger2_spk_embed_lang.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ drop_last_iter: false
5
+ dry_run: false
6
+ iterator_type: sequence
7
+ valid_iterator_type: null
8
+ output_dir: exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix
9
+ ngpu: 1
10
+ seed: 777
11
+ num_workers: 0
12
+ num_att_plot: 0
13
+ dist_backend: nccl
14
+ dist_init_method: env://
15
+ dist_world_size: null
16
+ dist_rank: null
17
+ local_rank: 0
18
+ dist_master_addr: null
19
+ dist_master_port: null
20
+ dist_launcher: null
21
+ multiprocessing_distributed: false
22
+ unused_parameters: true
23
+ sharded_ddp: false
24
+ use_deepspeed: false
25
+ deepspeed_config: null
26
+ gradient_as_bucket_view: true
27
+ ddp_comm_hook: null
28
+ cudnn_enabled: true
29
+ cudnn_benchmark: false
30
+ cudnn_deterministic: false
31
+ use_tf32: false
32
+ collect_stats: false
33
+ write_collected_feats: false
34
+ max_epoch: 500
35
+ patience: null
36
+ val_scheduler_criterion:
37
+ - valid
38
+ - loss
39
+ early_stopping_criterion:
40
+ - valid
41
+ - loss
42
+ - min
43
+ best_model_criterion:
44
+ - - train
45
+ - total_count
46
+ - max
47
+ keep_nbest_models: 10
48
+ nbest_averaging_interval: 0
49
+ grad_clip: -1
50
+ grad_clip_type: 2.0
51
+ grad_noise: false
52
+ accum_grad: 1
53
+ no_forward_run: false
54
+ resume: true
55
+ train_dtype: float32
56
+ use_amp: false
57
+ log_interval: 50
58
+ use_matplotlib: true
59
+ use_tensorboard: true
60
+ create_graph_in_tensorboard: false
61
+ use_wandb: false
62
+ wandb_project: null
63
+ wandb_id: null
64
+ wandb_entity: null
65
+ wandb_name: null
66
+ wandb_model_log_interval: -1
67
+ detect_anomaly: false
68
+ use_adapter: false
69
+ adapter: lora
70
+ save_strategy: all
71
+ adapter_conf: {}
72
+ pretrain_path: null
73
+ init_param: []
74
+ ignore_init_mismatch: false
75
+ freeze_param: []
76
+ num_iters_per_epoch: 1000
77
+ batch_size: 8
78
+ valid_batch_size: null
79
+ batch_bins: 1000000
80
+ valid_batch_bins: null
81
+ category_sample_size: 10
82
+ train_shape_file:
83
+ - exp/svs_stats_raw_phn_none_mix/train/text_shape.phn
84
+ - exp/svs_stats_raw_phn_none_mix/train/singing_shape
85
+ valid_shape_file:
86
+ - exp/svs_stats_raw_phn_none_mix/valid/text_shape.phn
87
+ - exp/svs_stats_raw_phn_none_mix/valid/singing_shape
88
+ batch_type: sorted
89
+ valid_batch_type: null
90
+ fold_length:
91
+ - 150
92
+ - 409600
93
+ sort_in_batch: descending
94
+ shuffle_within_batch: false
95
+ sort_batch: descending
96
+ multiple_iterator: false
97
+ chunk_length: 500
98
+ chunk_shift_ratio: 0.5
99
+ num_cache_chunks: 1024
100
+ chunk_excluded_key_prefixes: []
101
+ chunk_default_fs: null
102
+ chunk_max_abs_length: null
103
+ chunk_discard_short_samples: true
104
+ train_data_path_and_name_and_type:
105
+ - - dump_mix/raw/tr_no_dev/text
106
+ - text
107
+ - text
108
+ - - dump_mix/raw/tr_no_dev/wav.scp
109
+ - singing
110
+ - sound
111
+ - - dump_mix/raw/tr_no_dev/label
112
+ - label
113
+ - duration
114
+ - - dump_mix/raw/tr_no_dev/score.scp
115
+ - score
116
+ - score
117
+ - - exp/svs_stats_raw_phn_none_mix/train/collect_feats/pitch.scp
118
+ - pitch
119
+ - npy
120
+ - - exp/svs_stats_raw_phn_none_mix/train/collect_feats/feats.scp
121
+ - feats
122
+ - npy
123
+ - - dump_mix/espnet_spk/tr_no_dev/espnet_spk.scp
124
+ - spembs
125
+ - kaldi_ark
126
+ - - dump_mix/raw/tr_no_dev/utt2sid
127
+ - sids
128
+ - text_int
129
+ - - dump_mix/raw/tr_no_dev/utt2lid
130
+ - lids
131
+ - text_int
132
+ valid_data_path_and_name_and_type:
133
+ - - dump_mix/raw/dev/text
134
+ - text
135
+ - text
136
+ - - dump_mix/raw/dev/wav.scp
137
+ - singing
138
+ - sound
139
+ - - dump_mix/raw/dev/label
140
+ - label
141
+ - duration
142
+ - - dump_mix/raw/dev/score.scp
143
+ - score
144
+ - score
145
+ - - exp/svs_stats_raw_phn_none_mix/valid/collect_feats/pitch.scp
146
+ - pitch
147
+ - npy
148
+ - - exp/svs_stats_raw_phn_none_mix/valid/collect_feats/feats.scp
149
+ - feats
150
+ - npy
151
+ - - dump_mix/espnet_spk/dev/espnet_spk.scp
152
+ - spembs
153
+ - kaldi_ark
154
+ - - dump_mix/raw/dev/utt2sid
155
+ - sids
156
+ - text_int
157
+ - - dump_mix/raw/dev/utt2lid
158
+ - lids
159
+ - text_int
160
+ multi_task_dataset: false
161
+ allow_variable_data_keys: false
162
+ max_cache_size: 0.0
163
+ max_cache_fd: 32
164
+ allow_multi_rates: false
165
+ valid_max_cache_size: null
166
+ exclude_weight_decay: false
167
+ exclude_weight_decay_conf: {}
168
+ optim: adamw
169
+ optim_conf:
170
+ lr: 0.0002
171
+ betas:
172
+ - 0.8
173
+ - 0.99
174
+ eps: 1.0e-09
175
+ weight_decay: 0.0
176
+ scheduler: exponentiallr
177
+ scheduler_conf:
178
+ gamma: 0.998
179
+ optim2: adamw
180
+ optim2_conf:
181
+ lr: 0.0002
182
+ betas:
183
+ - 0.8
184
+ - 0.99
185
+ eps: 1.0e-09
186
+ weight_decay: 0.0
187
+ scheduler2: exponentiallr
188
+ scheduler2_conf:
189
+ gamma: 0.998
190
+ generator_first: true
191
+ skip_discriminator_prob: 0.0
192
+ input_size: null
193
+ token_list:
194
+ - <blank>
195
+ - <unk>
196
+ - SP
197
+ - AP
198
+ - i@zh
199
+ - e@zh
200
+ - d@zh
201
+ - y@zh
202
+ - uo@zh
203
+ - sh@zh
204
+ - ian@zh
205
+ - ai@zh
206
+ - n@zh
207
+ - u@zh
208
+ - w@zh
209
+ - x@zh
210
+ - j@zh
211
+ - l@zh
212
+ - h@zh
213
+ - b@zh
214
+ - iii@zh
215
+ - zh@zh
216
+ - uei@zh
217
+ - m@zh
218
+ - ing@zh
219
+ - q@zh
220
+ - z@zh
221
+ - g@zh
222
+ - eng@zh
223
+ - a@zh
224
+ - an@zh
225
+ - en@zh
226
+ - iou@zh
227
+ - ou@zh
228
+ - t@zh
229
+ - ao@zh
230
+ - ong@zh
231
+ - iang@zh
232
+ - ang@zh
233
+ - ei@zh
234
+ - iao@zh
235
+ - ie@zh
236
+ - f@zh
237
+ - r@zh
238
+ - k@zh
239
+ - ch@zh
240
+ - v@zh
241
+ - in@zh
242
+ - a@jp
243
+ - uan@zh
244
+ - o@jp
245
+ - c@zh
246
+ - i@jp
247
+ - s@zh
248
+ - uang@zh
249
+ - ii@zh
250
+ - van@zh
251
+ - p@zh
252
+ - ve@zh
253
+ - u@jp
254
+ - e@jp
255
+ - ia@zh
256
+ - uen@zh
257
+ - k@jp
258
+ - ua@zh
259
+ - n@jp
260
+ - iong@zh
261
+ - t@jp
262
+ - r@jp
263
+ - uai@zh
264
+ - m@jp
265
+ - er@zh
266
+ - s@jp
267
+ - vn@zh
268
+ - w@jp
269
+ - d@jp
270
+ - N@jp
271
+ - sh@jp
272
+ - g@jp
273
+ - y@jp
274
+ - o@zh
275
+ - b@jp
276
+ - ts@jp
277
+ - h@jp
278
+ - cl@jp
279
+ - z@jp
280
+ - ch@jp
281
+ - j@jp
282
+ - f@jp
283
+ - p@jp
284
+ - ky@jp
285
+ - ry@jp
286
+ - gy@jp
287
+ - ny@jp
288
+ - hy@jp
289
+ - my@jp
290
+ - by@jp
291
+ - py@jp
292
+ - ty@jp
293
+ - dy@jp
294
+ - v@jp
295
+ - <sos/eos>
296
+ odim: null
297
+ model_conf: {}
298
+ use_preprocessor: true
299
+ token_type: phn
300
+ bpemodel: null
301
+ non_linguistic_symbols: null
302
+ cleaner: null
303
+ g2p: null
304
+ fs: 44100
305
+ postfrontend: null
306
+ postfrontend_conf: {}
307
+ score_feats_extract: syllable_score_feats
308
+ score_feats_extract_conf:
309
+ fs: 44100
310
+ n_fft: 2048
311
+ win_length: 2048
312
+ hop_length: 512
313
+ feats_extract: fbank
314
+ feats_extract_conf:
315
+ n_fft: 2048
316
+ hop_length: 512
317
+ win_length: 2048
318
+ fs: 44100
319
+ fmin: 80
320
+ fmax: 22050
321
+ n_mels: 80
322
+ normalize: null
323
+ normalize_conf: {}
324
+ svs: vits
325
+ svs_conf:
326
+ generator_type: visinger2
327
+ vocoder_generator_type: visinger2
328
+ generator_params:
329
+ hidden_channels: 192
330
+ spk_embed_dim: 192
331
+ langs: 3
332
+ global_channels: 256
333
+ segment_size: 20
334
+ text_encoder_attention_heads: 2
335
+ text_encoder_ffn_expand: 4
336
+ text_encoder_blocks: 6
337
+ text_encoder_positionwise_layer_type: conv1d
338
+ text_encoder_positionwise_conv_kernel_size: 3
339
+ text_encoder_positional_encoding_layer_type: rel_pos
340
+ text_encoder_self_attention_layer_type: rel_selfattn
341
+ text_encoder_activation_type: swish
342
+ text_encoder_normalize_before: true
343
+ text_encoder_dropout_rate: 0.1
344
+ text_encoder_positional_dropout_rate: 0.0
345
+ text_encoder_attention_dropout_rate: 0.1
346
+ use_macaron_style_in_text_encoder: true
347
+ use_conformer_conv_in_text_encoder: false
348
+ text_encoder_conformer_kernel_size: -1
349
+ decoder_kernel_size: 7
350
+ decoder_channels: 256
351
+ decoder_upsample_scales:
352
+ - 8
353
+ - 8
354
+ - 4
355
+ - 2
356
+ decoder_upsample_kernel_sizes:
357
+ - 16
358
+ - 16
359
+ - 8
360
+ - 4
361
+ n_harmonic: 64
362
+ decoder_resblock_kernel_sizes:
363
+ - 3
364
+ - 7
365
+ - 11
366
+ decoder_resblock_dilations:
367
+ - - 1
368
+ - 3
369
+ - 5
370
+ - - 1
371
+ - 3
372
+ - 5
373
+ - - 1
374
+ - 3
375
+ - 5
376
+ use_weight_norm_in_decoder: true
377
+ posterior_encoder_kernel_size: 3
378
+ posterior_encoder_layers: 8
379
+ posterior_encoder_stacks: 1
380
+ posterior_encoder_base_dilation: 1
381
+ posterior_encoder_dropout_rate: 0.0
382
+ use_weight_norm_in_posterior_encoder: true
383
+ flow_flows: -1
384
+ flow_kernel_size: 5
385
+ flow_base_dilation: 1
386
+ flow_layers: 4
387
+ flow_dropout_rate: 0.0
388
+ use_weight_norm_in_flow: true
389
+ use_only_mean_in_flow: true
390
+ use_phoneme_predictor: false
391
+ hubert_channels: null
392
+ vocabs: 102
393
+ aux_channels: 80
394
+ generator_type: visinger2
395
+ vocoder_generator_type: visinger2
396
+ fs: 44100
397
+ hop_length: 512
398
+ win_length: 2048
399
+ n_fft: 2048
400
+ discriminator_type: visinger2
401
+ discriminator_params:
402
+ scales: 1
403
+ scale_downsample_pooling: AvgPool1d
404
+ scale_downsample_pooling_params:
405
+ kernel_size: 4
406
+ stride: 2
407
+ padding: 2
408
+ scale_discriminator_params:
409
+ in_channels: 1
410
+ out_channels: 1
411
+ kernel_sizes:
412
+ - 15
413
+ - 41
414
+ - 5
415
+ - 3
416
+ channels: 128
417
+ max_downsample_channels: 1024
418
+ max_groups: 256
419
+ bias: true
420
+ downsample_scales:
421
+ - 4
422
+ - 4
423
+ - 4
424
+ - 4
425
+ nonlinear_activation: LeakyReLU
426
+ nonlinear_activation_params:
427
+ negative_slope: 0.1
428
+ use_weight_norm: true
429
+ use_spectral_norm: false
430
+ follow_official_norm: false
431
+ periods:
432
+ - 2
433
+ - 3
434
+ - 5
435
+ - 7
436
+ - 11
437
+ period_discriminator_params:
438
+ in_channels: 1
439
+ out_channels: 1
440
+ kernel_sizes:
441
+ - 5
442
+ - 3
443
+ channels: 32
444
+ downsample_scales:
445
+ - 3
446
+ - 3
447
+ - 3
448
+ - 3
449
+ - 1
450
+ max_downsample_channels: 1024
451
+ bias: true
452
+ nonlinear_activation: LeakyReLU
453
+ nonlinear_activation_params:
454
+ negative_slope: 0.1
455
+ use_weight_norm: true
456
+ use_spectral_norm: false
457
+ multi_freq_disc_params:
458
+ hidden_channels:
459
+ - 256
460
+ - 256
461
+ - 256
462
+ - 256
463
+ - 256
464
+ domain: double
465
+ mel_scale: true
466
+ divisors:
467
+ - 32
468
+ - 16
469
+ - 8
470
+ - 4
471
+ - 2
472
+ - 1
473
+ - 1
474
+ strides:
475
+ - 1
476
+ - 2
477
+ - 1
478
+ - 2
479
+ - 1
480
+ - 2
481
+ - 1
482
+ sample_rate: 44100
483
+ hop_lengths:
484
+ - 110
485
+ - 220
486
+ - 330
487
+ - 441
488
+ - 551
489
+ - 661
490
+ generator_adv_loss_params:
491
+ average_by_discriminators: false
492
+ loss_type: mse
493
+ discriminator_adv_loss_params:
494
+ average_by_discriminators: false
495
+ loss_type: mse
496
+ feat_match_loss_params:
497
+ average_by_discriminators: false
498
+ average_by_layers: false
499
+ include_final_outputs: true
500
+ mel_loss_params:
501
+ fs: 44100
502
+ n_fft: 2048
503
+ hop_length: 512
504
+ win_length: 2048
505
+ window: hann
506
+ n_mels: 80
507
+ fmin: 0
508
+ fmax: 22050
509
+ log_base: null
510
+ lambda_adv: 1.0
511
+ lambda_mel: 45.0
512
+ lambda_feat_match: 2.0
513
+ lambda_dur: 0.1
514
+ lambda_pitch: 10.0
515
+ lambda_phoneme: 1.0
516
+ lambda_kl: 1.0
517
+ sampling_rate: 44100
518
+ cache_generator_outputs: true
519
+ pitch_extract: dio
520
+ pitch_extract_conf:
521
+ use_token_averaged_f0: false
522
+ use_log_f0: false
523
+ fs: 44100
524
+ n_fft: 2048
525
+ hop_length: 512
526
+ f0max: 810
527
+ f0min: 80
528
+ pitch_normalize: null
529
+ pitch_normalize_conf:
530
+ stats_file: exp/svs_stats_raw_phn_none_mix/train/pitch_stats.npz
531
+ ying_extract: null
532
+ ying_extract_conf: {}
533
+ energy_extract: null
534
+ energy_extract_conf: {}
535
+ energy_normalize: null
536
+ energy_normalize_conf: {}
537
+ required:
538
+ - output_dir
539
+ - token_list
540
+ version: '202503'
541
+ distributed: false
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_backward_time.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_fake_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_forward_time.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_optim_step_time.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_real_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_train_time.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_adv_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_backward_time.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_feat_match_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_forward_time.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_kl_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_am_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_ddsp_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_optim_step_time.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_phn_dur_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_pitch_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_score_dur_loss.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_train_time.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/iter_time.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/optim0_lr0.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/optim1_lr0.png ADDED
exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/train_time.png ADDED