diff --git a/exp/svs_stats_raw_phn_none_mix/train/feats_stats.npz b/exp/svs_stats_raw_phn_none_mix/train/feats_stats.npz new file mode 100644 index 0000000000000000000000000000000000000000..0cec0c5573194020f775c100ed23a55a15ebca0d --- /dev/null +++ b/exp/svs_stats_raw_phn_none_mix/train/feats_stats.npz @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95cbffa329e7b157b9c3481e7f8442a1867ead3b27518e7649ec486b76a56fab +size 1402 diff --git a/exp/svs_stats_raw_phn_none_mix/train/pitch_stats.npz b/exp/svs_stats_raw_phn_none_mix/train/pitch_stats.npz new file mode 100644 index 0000000000000000000000000000000000000000..81205d2fc4226edd6870b4bf815d79cf4c56f2fd --- /dev/null +++ b/exp/svs_stats_raw_phn_none_mix/train/pitch_stats.npz @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57b5a91ae0d5d359c421e234aadc10c44f3892fb73392cfb1cdb72810afbca1c +size 770 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/500epoch.pth b/exp/svs_train_visinger2_raw_phn_none_mix/500epoch.pth deleted file mode 100644 index 6d863e9a3a8c0ac021efefe2efc6604a99a933ad..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/500epoch.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2c2d019f47dce46ab6f9022606ba4d02365a39ba090093db562ec7f5ba0edd22 -size 448311886 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_backward_time.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_backward_time.png deleted file mode 100644 index 696b547dcc061db6273b9868c746ab51ffd5c70b..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_backward_time.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:87c466c2258086564e173d691d245d8ed1a02d6baf873df3d2d58bc5f9b61090 -size 49691 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_fake_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_fake_loss.png deleted file mode 100644 index 16f64beafcaa6220d166278240693cde05731126..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_fake_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2e13b134b81e5fbe422facdacb4f902d9bfcb100b9af0db37d7679c39f2f0d3d -size 70285 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_forward_time.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_forward_time.png deleted file mode 100644 index 8eddd04d6d9c12584c843d7c0939879422f5026e..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_forward_time.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:dabc6c55d6feccd80ce843f648ea8e93a3449910df4ed9e7cbd0976d7d4a72f1 -size 50486 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_loss.png deleted file mode 100644 index 2f140b0d9bb37f78192e37d01b8ec50e69226544..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0128375cff96feefa7bc083a580522796dc8abd9a301b94f0483d9acc199d19e -size 69034 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_optim_step_time.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_optim_step_time.png deleted file mode 100644 index 350bf58eb57b2af884afac95518b4c08b34609d9..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_optim_step_time.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:05723699858e27a6a860f74b5eeedf66efde57495efc7a22e02a580b5f9586ba -size 43341 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_real_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_real_loss.png deleted file mode 100644 index 59dddde5b81335f56c45d80127c3bcce6e39c446..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_real_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bd8b6e27b5064e5adf81486bd0ab6f72db3ea370727c3d33579043020a3557bc -size 81651 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_train_time.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_train_time.png deleted file mode 100644 index c3522b952481d1200a7ee7369a78edfb22318e18..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/discriminator_train_time.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b3fa2e7844d762b109f5609d1db3f5bb49e797ff7ffe2fc902dffaae2cb162e7 -size 41137 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_adv_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_adv_loss.png deleted file mode 100644 index 67deab08c967e715648dccec89ece45e087e7358..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_adv_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d3d66f20b5a8ffd157b02d429593d3c516e797ba6d64d1ea9a94d905e9132eb5 -size 76140 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_backward_time.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_backward_time.png deleted file mode 100644 index b9dac4ef296daefd8975c6dd47cb4a58b9e61c47..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_backward_time.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b87014020b976ad56e678dfdb5ce133278ac1fef30a88dbf9ff610c673b886f7 -size 47417 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_feat_match_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_feat_match_loss.png deleted file mode 100644 index 64a5dce01b60ce6ed5cdac8cdc878fd5d9ff6f3b..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_feat_match_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bd44bc580fb634dc769bc2e105d2a245de1b2850dffa4fcad513c9fb623b500f -size 62407 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_forward_time.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_forward_time.png deleted file mode 100644 index e35807a4b8ca4063447c1d50f80c0bea495c222d..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_forward_time.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:696acbb8cd9cb4fa33210a651bc483e72b3dd8df20a5de4b544648e3c09532cd -size 54217 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_kl_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_kl_loss.png deleted file mode 100644 index 91f4e7a8689e97c65c12ed9ab18e78bf0009e988..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_kl_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f327358d973d8d7edcc55cab35ea05d567344f918c537a3d731e6d5b29a79d3f -size 45494 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_loss.png deleted file mode 100644 index f345075ab27c3c449f85ab415126805731aeb54d..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:324fccbb8486b80faca28c3162d20a8d8ec1b30e5fcd422299891d7d7253ea8a -size 33575 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_am_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_am_loss.png deleted file mode 100644 index 8b0e631a205d16c217f80ccc9116f48fbfa00b1d..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_am_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8c7c694065c7ed753629309788b1daeb72c6181ad6b244c72906fe96dfbf5cce -size 40035 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_ddsp_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_ddsp_loss.png deleted file mode 100644 index 291fa5e950cdf4a0c0cdbf81795709f040ecb256..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_ddsp_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:77c8d8215f851c1cbf6873fd6bd9362656622ccdbd09d841806fe0ff99bec16b -size 42236 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_loss.png deleted file mode 100644 index 7e665e244b2176843aa7338afb121dd9b216de4a..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_mel_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:aa4c1a56c64b67c44aec8b719a8e4b63924db9f5a0922b08d77853248a8343fb -size 36412 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_optim_step_time.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_optim_step_time.png deleted file mode 100644 index 3a24392d728fc86589136c3422d70f200a012dd7..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_optim_step_time.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f487695c628d2eeaaa459d0ec22102ab369d28318ad41907b7888a3f992f0cd7 -size 46340 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_phn_dur_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_phn_dur_loss.png deleted file mode 100644 index 3c66305096cb0394aae3447a61aeeb332525c9f6..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_phn_dur_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d0e27840cc6152dbb9fbd0f9d54ef6f2ec59929879d8248bf3726d9e00c09981 -size 34419 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_pitch_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_pitch_loss.png deleted file mode 100644 index 4f846ffda2865956e2269f3ee03942a27c9b574d..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_pitch_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5ade6be19950ae5ec95127fdc45882c8875dadced0bd65fd6f0375e8e73193bc -size 41108 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_score_dur_loss.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_score_dur_loss.png deleted file mode 100644 index 74c3b0b0203480ddcead54b0c99043256edbea43..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_score_dur_loss.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4a004a15e60922fc8dbdc6abe9607ccef720c9904730110f7121bd470507b9a5 -size 35591 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_train_time.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_train_time.png deleted file mode 100644 index 650ee1cabd7ff2d02a48fbf017246ccb6ce941f7..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/generator_train_time.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f6abcc8576877e2b4c467b0715e750df72e2c81ddc587d8eafd5671967c60dc9 -size 47483 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png deleted file mode 100644 index 708589bb7a1da1ab88a71bdd7c7b119a70f8f3b6..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:510b013e54b86f364104a00e3d8751aedd3583369fc186487439ac670d1b38dd -size 27850 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/iter_time.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/iter_time.png deleted file mode 100644 index ec2b36e4dc4b36b8a741529db6a39e419c14c6a1..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/iter_time.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:24e709b88b61ca07683b62d1338e4b7905c5d1f9d01953701c91ced86d16cc1a -size 40059 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/optim0_lr0.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/optim0_lr0.png deleted file mode 100644 index 2919f472b7ed8aecbc88f9a1e8292395680c3980..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/optim0_lr0.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:172e6b2bb6d0408d84b2c15751f3f639aa70be783dd06dabe5026abc2296e862 -size 29569 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/optim1_lr0.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/optim1_lr0.png deleted file mode 100644 index dda2dd4f938ee43deb88ca07c1eb518c0cd8996e..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/optim1_lr0.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:00a96617ad7d53e985319525806f3c6a6e93555ab6f6a4cd014e97f2ded1ca17 -size 29370 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/images/train_time.png b/exp/svs_train_visinger2_raw_phn_none_mix/images/train_time.png deleted file mode 100644 index e54a62523180f7009211a49704eb340a191406bf..0000000000000000000000000000000000000000 --- a/exp/svs_train_visinger2_raw_phn_none_mix/images/train_time.png +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8d7307370394806818c969ecf5ce838aac66292f62ea4b1aa36ea15483095fbd -size 44435 diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/500epoch.pth b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/500epoch.pth new file mode 100644 index 0000000000000000000000000000000000000000..eb2e3dbfe65a3747e6656d07f201da13df4499cc --- /dev/null +++ b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/500epoch.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c93a08500a8958e48a57dd6780033635d11916de8e1d72a8691124ef2eb95f2a +size 448412302 diff --git a/exp/svs_train_visinger2_raw_phn_none_mix/config.yaml b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/config.yaml similarity index 97% rename from exp/svs_train_visinger2_raw_phn_none_mix/config.yaml rename to exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/config.yaml index 25e5540dee47b0635ec4382f9618fbb016543288..42c65aff517a8c9fb62200f52f6fa23f853cc1c1 100644 --- a/exp/svs_train_visinger2_raw_phn_none_mix/config.yaml +++ b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/config.yaml @@ -1,11 +1,11 @@ -config: conf/tuning/train_visinger2.yaml +config: conf/tuning/train_visinger2_spk_embed_lang.yaml print_config: false log_level: INFO drop_last_iter: false dry_run: false iterator_type: sequence valid_iterator_type: null -output_dir: exp/svs_train_visinger2_raw_phn_none_mix +output_dir: exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix ngpu: 1 seed: 777 num_workers: 0 @@ -224,8 +224,8 @@ token_list: - an@zh - en@zh - iou@zh -- t@zh - ou@zh +- t@zh - ao@zh - ong@zh - iang@zh @@ -319,16 +319,15 @@ feats_extract_conf: fmin: 80 fmax: 22050 n_mels: 80 -normalize: global_mvn -normalize_conf: - stats_file: exp/svs_stats_raw_phn_none_mix/train/feats_stats.npz +normalize: null +normalize_conf: {} svs: vits svs_conf: generator_type: visinger2 vocoder_generator_type: visinger2 generator_params: hidden_channels: 192 - spks: 94 + spk_embed_dim: 192 langs: 3 global_channels: 256 segment_size: 20 @@ -538,5 +537,5 @@ energy_normalize_conf: {} required: - output_dir - token_list -version: '202412' +version: '202503' distributed: false diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_backward_time.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_backward_time.png new file mode 100644 index 0000000000000000000000000000000000000000..f8aa9e45293e88e7a5851bbaf424de54512b00ee Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_backward_time.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_fake_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_fake_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..54e71779e78a1d5f94c06059b53523ad51ce009a Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_fake_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_forward_time.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_forward_time.png new file mode 100644 index 0000000000000000000000000000000000000000..0b075910600166632b3525253ec76a1c446635e9 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_forward_time.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..e1a6f314d5de1666b10cc2441bc236a840cc3f48 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_optim_step_time.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_optim_step_time.png new file mode 100644 index 0000000000000000000000000000000000000000..ae01b2bac01d0d419d5a44d20d066498e383128b Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_optim_step_time.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_real_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_real_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..c2a86f77a95086841f27a1972a030da6e6c3862d Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_real_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_train_time.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_train_time.png new file mode 100644 index 0000000000000000000000000000000000000000..5e5e3d87648b915dc21baf2ea3038896dd62eeb7 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/discriminator_train_time.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_adv_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_adv_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..8d3c88366348be0ff122e30212c5a930924a4647 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_adv_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_backward_time.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_backward_time.png new file mode 100644 index 0000000000000000000000000000000000000000..310ccf2963d4e7169a66f739b1c14a3441718cae Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_backward_time.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_feat_match_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_feat_match_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..83d7dca854eeb7287e1e10bee4408981c5a7cf64 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_feat_match_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_forward_time.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_forward_time.png new file mode 100644 index 0000000000000000000000000000000000000000..fbb90e4a7e1f63e51d2118520b207d023fe32d7c Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_forward_time.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_kl_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_kl_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..496322ed9d9476b1e7988b197382654c6608aa01 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_kl_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..9c7f78398de9b19c676d9cbfc296af617cb3110f Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_am_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_am_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..345d6f6cb9bf7271c2e2dc050bbed2b92e601bba Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_am_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_ddsp_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_ddsp_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..ac8269f49dcddeb21daedf145bc9bf8cf31517bd Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_ddsp_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..ea60354dc4097cfa0c8b87ae08d2632745bf06e0 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_mel_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_optim_step_time.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_optim_step_time.png new file mode 100644 index 0000000000000000000000000000000000000000..ba0592bd11272438e2a24e25726135a654f26700 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_optim_step_time.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_phn_dur_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_phn_dur_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..ba235b32ffa7603bfecc4a634594ae0d740d8997 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_phn_dur_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_pitch_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_pitch_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..d15e8336515f831f67bbe3ef3b6b051778040b6c Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_pitch_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_score_dur_loss.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_score_dur_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..f895f9ef42d5ac33c060314bdf7d42d2ed50acbd Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_score_dur_loss.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_train_time.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_train_time.png new file mode 100644 index 0000000000000000000000000000000000000000..d901de4d88aabcba9493f4ecdd4dd962b10bc50a Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/generator_train_time.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png new file mode 100644 index 0000000000000000000000000000000000000000..e19d4fafb2fdd3004d2f82dad4e752a92d25b0e6 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/gpu_max_cached_mem_GB.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/iter_time.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/iter_time.png new file mode 100644 index 0000000000000000000000000000000000000000..9c64950b026b31ce573625431ad16e22c2c73d74 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/iter_time.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/optim0_lr0.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/optim0_lr0.png new file mode 100644 index 0000000000000000000000000000000000000000..b2f756b704b67ebf9ed2a5a702e5fe17d78a62ce Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/optim0_lr0.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/optim1_lr0.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/optim1_lr0.png new file mode 100644 index 0000000000000000000000000000000000000000..b6d16a49dc7ca1d339a50d906c5305ac0027b134 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/optim1_lr0.png differ diff --git a/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/train_time.png b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/train_time.png new file mode 100644 index 0000000000000000000000000000000000000000..863020c4f39f59cbbf99b5b58b75190c11720ec7 Binary files /dev/null and b/exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/images/train_time.png differ diff --git a/meta.yaml b/meta.yaml new file mode 100644 index 0000000000000000000000000000000000000000..d63eb2eff37dd08b19cbe26ea19b9f3aa8b11f32 --- /dev/null +++ b/meta.yaml @@ -0,0 +1,8 @@ +espnet: '202503' +files: + model_file: exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/500epoch.pth +python: 3.10.16 (main, Dec 11 2024, 16:24:50) [GCC 11.2.0] +timestamp: 1751437686.716423 +torch: 2.5.1+cu124 +yaml_files: + train_config: exp/svs_train_visinger2_spk_embed_lang_raw_phn_none_mix/config.yaml