Upload folder using huggingface_hub
Browse files
LJSpeech6/config.yml
CHANGED
@@ -1,21 +1,118 @@
|
|
1 |
-
|
2 |
-
|
3 |
-
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
-
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
log_dir: "Models/LJSpeech6"
|
2 |
+
first_stage_path: "first_stage.pth"
|
3 |
+
save_freq: 1
|
4 |
+
log_interval: 10
|
5 |
+
device: "cuda"
|
6 |
+
epochs_1st: 2000 # number of epochs for first stage training (pre-training)
|
7 |
+
epochs_2nd: 300 # number of epochs for second stage training (joint training)
|
8 |
+
# first epoch = 3x650
|
9 |
+
# second epoch = 2x440
|
10 |
+
# second stage 1st epoch = 2x300
|
11 |
+
batch_size: 2
|
12 |
+
max_len: 550 # maximum number of frames
|
13 |
+
pretrained_model: "LJSpeech6/epoch_2nd_00171.pth"
|
14 |
+
second_stage_load_pretrained: true # set to true if the pre-trained model is for 2nd stage
|
15 |
+
load_only_params: false # set to true if you do not want to load epoch numbers and optimizer parameters
|
16 |
+
|
17 |
+
F0_path: "Utils/JDC/bst.t7"
|
18 |
+
ASR_config: "Utils/ASR/config.yml"
|
19 |
+
ASR_path: "Utils/ASR/epoch_00080.pth"
|
20 |
+
PLBERT_dir: 'Utils/PLBERT/'
|
21 |
+
|
22 |
+
data_params:
|
23 |
+
train_data: "Data/train_list.txt"
|
24 |
+
val_data: "Data/val_list.txt"
|
25 |
+
root_path: "/content/StyleTTS2/Dataset"
|
26 |
+
OOD_data: "Data/OOD_texts.txt"
|
27 |
+
min_length: 50 # sample until texts with this size are obtained for OOD texts
|
28 |
+
|
29 |
+
preprocess_params:
|
30 |
+
sr: 24000
|
31 |
+
spect_params:
|
32 |
+
n_fft: 2048
|
33 |
+
win_length: 1200
|
34 |
+
hop_length: 300
|
35 |
+
|
36 |
+
model_params:
|
37 |
+
multispeaker: false
|
38 |
+
|
39 |
+
dim_in: 64
|
40 |
+
hidden_dim: 512
|
41 |
+
max_conv_dim: 512
|
42 |
+
n_layer: 3
|
43 |
+
n_mels: 80
|
44 |
+
|
45 |
+
n_token: 185 # number of phoneme tokens
|
46 |
+
max_dur: 50 # maximum duration of a single phoneme
|
47 |
+
style_dim: 128 # style vector size
|
48 |
+
|
49 |
+
dropout: 0.2
|
50 |
+
|
51 |
+
# config for decoder
|
52 |
+
decoder:
|
53 |
+
type: 'istftnet' # either hifigan or istftnet
|
54 |
+
resblock_kernel_sizes: [3,7,11]
|
55 |
+
upsample_rates : [10, 6]
|
56 |
+
upsample_initial_channel: 512
|
57 |
+
resblock_dilation_sizes: [[1,3,5], [1,3,5], [1,3,5]]
|
58 |
+
upsample_kernel_sizes: [20, 12]
|
59 |
+
gen_istft_n_fft: 20
|
60 |
+
gen_istft_hop_size: 5
|
61 |
+
|
62 |
+
# speech language model config
|
63 |
+
slm:
|
64 |
+
model: 'microsoft/wavlm-base-plus'
|
65 |
+
sr: 16000 # sampling rate of SLM
|
66 |
+
hidden: 768 # hidden size of SLM
|
67 |
+
nlayers: 13 # number of layers of SLM
|
68 |
+
initial_channel: 64 # initial channels of SLM discriminator head
|
69 |
+
|
70 |
+
# style diffusion model config
|
71 |
+
diffusion:
|
72 |
+
embedding_mask_proba: 0.1
|
73 |
+
# transformer config
|
74 |
+
transformer:
|
75 |
+
num_layers: 3
|
76 |
+
num_heads: 8
|
77 |
+
head_features: 64
|
78 |
+
multiplier: 2
|
79 |
+
|
80 |
+
# diffusion distribution config
|
81 |
+
dist:
|
82 |
+
sigma_data: 0.2 # placeholder used when estimate_sigma_data is set to false
|
83 |
+
estimate_sigma_data: true # estimate sigma_data from the current batch if set to true
|
84 |
+
mean: -3.0
|
85 |
+
std: 1.0
|
86 |
+
|
87 |
+
loss_params:
|
88 |
+
lambda_mel: 5. # mel reconstruction loss
|
89 |
+
lambda_gen: 1. # generator loss
|
90 |
+
lambda_slm: 1. # slm feature matching loss
|
91 |
+
|
92 |
+
lambda_mono: 1. # monotonic alignment loss (1st stage, TMA)
|
93 |
+
lambda_s2s: 1. # sequence-to-sequence loss (1st stage, TMA)
|
94 |
+
TMA_epoch: 2 # TMA starting epoch (1st stage)
|
95 |
+
|
96 |
+
lambda_F0: 1. # F0 reconstruction loss (2nd stage)
|
97 |
+
lambda_norm: 1. # norm reconstruction loss (2nd stage)
|
98 |
+
lambda_dur: 1. # duration loss (2nd stage)
|
99 |
+
lambda_ce: 20. # duration predictor probability output CE loss (2nd stage)
|
100 |
+
lambda_sty: 1. # style reconstruction loss (2nd stage)
|
101 |
+
lambda_diff: 1. # score matching loss (2nd stage)
|
102 |
+
|
103 |
+
diff_epoch: 0 # style diffusion starting epoch (2nd stage)
|
104 |
+
joint_epoch: 0 # joint training starting epoch (2nd stage)
|
105 |
+
|
106 |
+
optimizer_params:
|
107 |
+
lr: 0.0001 # general learning rate
|
108 |
+
bert_lr: 0.00001 # learning rate for PLBERT
|
109 |
+
ft_lr: 0.00001 # learning rate for acoustic modules
|
110 |
+
|
111 |
+
slmadv_params:
|
112 |
+
min_len: 400 # minimum length of samples
|
113 |
+
max_len: 500 # maximum length of samples
|
114 |
+
batch_percentage: 1 # fraction of the original batch size to use; lower it (e.g. 0.5 for half) to prevent out of memory
|
115 |
+
iter: 10 # update the discriminator once every this many generator updates
|
116 |
+
thresh: 5 # gradient norm above which the gradient is scaled
|
117 |
+
scale: 0.01 # gradient scaling factor for predictors from SLM discriminators
|
118 |
+
sig: 1.5 # sigma for differentiable duration modeling
|
LJSpeech6/epoch_2nd_00172.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f23ce02282028632e56d8a12dea0a92f349b30055757d40e465e236864118af4
|
3 |
+
size 1279652187
|
LJSpeech6/tensorboard/events.out.tfevents.1745042681.c1102d9153bb.9929.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56ce906b492728aa55abb20ad7de48a0cd75b495644c5600806a38dc8b92a36a
|
3 |
+
size 28618
|
LJSpeech6/train.log
CHANGED
@@ -1,73 +1,90 @@
|
|
1 |
-
INFO:2025-04-19
|
2 |
-
INFO:2025-04-19
|
3 |
-
INFO:2025-04-19
|
4 |
-
INFO:2025-04-19
|
5 |
-
INFO:2025-04-19
|
6 |
-
INFO:2025-04-19
|
7 |
-
INFO:2025-04-19
|
8 |
-
INFO:2025-04-19
|
9 |
-
INFO:2025-04-19
|
10 |
-
INFO:2025-04-19
|
11 |
-
INFO:2025-04-19
|
12 |
-
INFO:2025-04-19
|
13 |
-
INFO:2025-04-19
|
14 |
-
INFO:2025-04-19
|
15 |
-
INFO:2025-04-19
|
16 |
-
INFO:2025-04-19
|
17 |
-
INFO:2025-04-19
|
18 |
-
INFO:2025-04-19
|
19 |
-
INFO:2025-04-19
|
20 |
-
INFO:2025-04-19
|
21 |
-
INFO:2025-04-19
|
22 |
-
INFO:2025-04-19
|
23 |
-
INFO:2025-04-19
|
24 |
-
INFO:2025-04-19
|
25 |
-
INFO:2025-04-19
|
26 |
-
INFO:2025-04-19
|
27 |
-
INFO:2025-04-19
|
28 |
-
INFO:2025-04-19
|
29 |
-
INFO:2025-04-19
|
30 |
-
INFO:2025-04-19
|
31 |
-
INFO:2025-04-19
|
32 |
-
INFO:2025-04-19
|
33 |
-
INFO:2025-04-19
|
34 |
-
INFO:2025-04-19
|
35 |
-
INFO:2025-04-19
|
36 |
-
INFO:2025-04-19
|
37 |
-
INFO:2025-04-19
|
38 |
-
INFO:2025-04-19
|
39 |
-
INFO:2025-04-19
|
40 |
-
INFO:2025-04-19
|
41 |
-
INFO:2025-04-19
|
42 |
-
INFO:2025-04-19
|
43 |
-
INFO:2025-04-19
|
44 |
-
INFO:2025-04-19
|
45 |
-
INFO:2025-04-19
|
46 |
-
INFO:2025-04-19
|
47 |
-
INFO:2025-04-19
|
48 |
-
INFO:2025-04-19
|
49 |
-
INFO:2025-04-19
|
50 |
-
INFO:2025-04-19
|
51 |
-
INFO:2025-04-19
|
52 |
-
INFO:2025-04-19
|
53 |
-
INFO:2025-04-19
|
54 |
-
INFO:2025-04-19
|
55 |
-
INFO:2025-04-19
|
56 |
-
INFO:2025-04-19
|
57 |
-
INFO:2025-04-19
|
58 |
-
INFO:2025-04-19
|
59 |
-
INFO:2025-04-19
|
60 |
-
INFO:2025-04-19
|
61 |
-
INFO:2025-04-19
|
62 |
-
INFO:2025-04-19
|
63 |
-
INFO:2025-04-19
|
64 |
-
INFO:2025-04-19
|
65 |
-
INFO:2025-04-19
|
66 |
-
INFO:2025-04-19
|
67 |
-
INFO:2025-04-19
|
68 |
-
INFO:2025-04-19
|
69 |
-
INFO:2025-04-19
|
70 |
-
INFO:2025-04-19
|
71 |
-
INFO:2025-04-19
|
72 |
-
INFO:2025-04-19
|
73 |
-
INFO:2025-04-19
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:2025-04-19 06:05:32,373: Epoch [172/2000], Step [10/103], Mel Loss: 0.49075, Gen Loss: 19.03080, Disc Loss: 1.87808, Mono Loss: 0.02912, S2S Loss: 2.88279, SLM Loss: 2.22280
|
2 |
+
INFO:2025-04-19 06:06:00,507: Epoch [172/2000], Step [20/103], Mel Loss: 0.46514, Gen Loss: 16.48240, Disc Loss: 2.28683, Mono Loss: 0.08921, S2S Loss: 3.05974, SLM Loss: 2.28222
|
3 |
+
INFO:2025-04-19 06:06:32,628: Epoch [172/2000], Step [30/103], Mel Loss: 0.49943, Gen Loss: 20.04922, Disc Loss: 1.67373, Mono Loss: 0.03095, S2S Loss: 3.09345, SLM Loss: 2.28325
|
4 |
+
INFO:2025-04-19 06:07:04,133: Epoch [172/2000], Step [40/103], Mel Loss: 0.49957, Gen Loss: 18.65599, Disc Loss: 1.82620, Mono Loss: 0.02344, S2S Loss: 2.88804, SLM Loss: 2.36621
|
5 |
+
INFO:2025-04-19 06:07:35,300: Epoch [172/2000], Step [50/103], Mel Loss: 0.47768, Gen Loss: 18.86207, Disc Loss: 2.09690, Mono Loss: 0.02290, S2S Loss: 3.06059, SLM Loss: 2.14493
|
6 |
+
INFO:2025-04-19 06:08:07,153: Epoch [172/2000], Step [60/103], Mel Loss: 0.52728, Gen Loss: 20.18369, Disc Loss: 1.82205, Mono Loss: 0.03392, S2S Loss: 3.04808, SLM Loss: 2.19737
|
7 |
+
INFO:2025-04-19 06:08:40,051: Epoch [172/2000], Step [70/103], Mel Loss: 0.50537, Gen Loss: 21.64199, Disc Loss: 1.55544, Mono Loss: 0.03042, S2S Loss: 2.95961, SLM Loss: 2.20869
|
8 |
+
INFO:2025-04-19 06:09:10,152: Epoch [172/2000], Step [80/103], Mel Loss: 0.50642, Gen Loss: 20.74788, Disc Loss: 1.58680, Mono Loss: 0.02950, S2S Loss: 3.19282, SLM Loss: 2.37025
|
9 |
+
INFO:2025-04-19 06:09:40,105: Epoch [172/2000], Step [90/103], Mel Loss: 0.49223, Gen Loss: 19.06367, Disc Loss: 2.18111, Mono Loss: 0.05383, S2S Loss: 2.64033, SLM Loss: 2.28037
|
10 |
+
INFO:2025-04-19 06:10:11,766: Epoch [172/2000], Step [100/103], Mel Loss: 0.49026, Gen Loss: 19.62444, Disc Loss: 1.59637, Mono Loss: 0.02270, S2S Loss: 2.71941, SLM Loss: 2.29486
|
11 |
+
INFO:2025-04-19 06:11:03,987: Epoch [173/2000], Step [10/103], Mel Loss: 0.51189, Gen Loss: 21.01040, Disc Loss: 1.54343, Mono Loss: 0.02302, S2S Loss: 3.00716, SLM Loss: 2.27467
|
12 |
+
INFO:2025-04-19 06:11:33,694: Epoch [173/2000], Step [20/103], Mel Loss: 0.48045, Gen Loss: 20.46531, Disc Loss: 1.54627, Mono Loss: 0.02493, S2S Loss: 2.70191, SLM Loss: 2.23879
|
13 |
+
INFO:2025-04-19 06:12:05,064: Epoch [173/2000], Step [30/103], Mel Loss: 0.49242, Gen Loss: 18.44250, Disc Loss: 1.85066, Mono Loss: 0.02167, S2S Loss: 2.54103, SLM Loss: 2.19616
|
14 |
+
INFO:2025-04-19 06:12:33,674: Epoch [173/2000], Step [40/103], Mel Loss: 0.46743, Gen Loss: 19.72079, Disc Loss: 1.66980, Mono Loss: 0.02674, S2S Loss: 2.93780, SLM Loss: 2.26917
|
15 |
+
INFO:2025-04-19 06:13:05,168: Epoch [173/2000], Step [50/103], Mel Loss: 0.48814, Gen Loss: 19.04391, Disc Loss: 2.00274, Mono Loss: 0.02832, S2S Loss: 2.75156, SLM Loss: 2.13500
|
16 |
+
INFO:2025-04-19 06:13:35,836: Epoch [173/2000], Step [60/103], Mel Loss: 0.50107, Gen Loss: 21.10793, Disc Loss: 1.52648, Mono Loss: 0.02576, S2S Loss: 2.82060, SLM Loss: 2.22685
|
17 |
+
INFO:2025-04-19 06:14:06,995: Epoch [173/2000], Step [70/103], Mel Loss: 0.51913, Gen Loss: 19.93866, Disc Loss: 1.66394, Mono Loss: 0.01771, S2S Loss: 2.49649, SLM Loss: 2.36162
|
18 |
+
INFO:2025-04-19 06:14:38,615: Epoch [173/2000], Step [80/103], Mel Loss: 0.49018, Gen Loss: 20.08590, Disc Loss: 1.49651, Mono Loss: 0.02133, S2S Loss: 2.96537, SLM Loss: 2.48091
|
19 |
+
INFO:2025-04-19 06:15:10,434: Epoch [173/2000], Step [90/103], Mel Loss: 0.50108, Gen Loss: 20.89732, Disc Loss: 1.62664, Mono Loss: 0.02150, S2S Loss: 2.67248, SLM Loss: 2.29798
|
20 |
+
INFO:2025-04-19 06:15:41,642: Epoch [173/2000], Step [100/103], Mel Loss: 0.46766, Gen Loss: 20.14573, Disc Loss: 1.63960, Mono Loss: 0.01970, S2S Loss: 2.61184, SLM Loss: 2.27835
|
21 |
+
INFO:2025-04-19 06:16:46,073: Epoch [174/2000], Step [10/103], Mel Loss: 0.50016, Gen Loss: 20.55195, Disc Loss: 1.52571, Mono Loss: 0.02179, S2S Loss: 2.65634, SLM Loss: 2.22372
|
22 |
+
INFO:2025-04-19 06:17:16,408: Epoch [174/2000], Step [20/103], Mel Loss: 0.49517, Gen Loss: 19.28646, Disc Loss: 1.76686, Mono Loss: 0.03635, S2S Loss: 3.09372, SLM Loss: 2.41635
|
23 |
+
INFO:2025-04-19 06:17:47,544: Epoch [174/2000], Step [30/103], Mel Loss: 0.50201, Gen Loss: 19.60267, Disc Loss: 1.74641, Mono Loss: 0.02212, S2S Loss: 2.79624, SLM Loss: 2.23391
|
24 |
+
INFO:2025-04-19 06:18:19,227: Epoch [174/2000], Step [40/103], Mel Loss: 0.45649, Gen Loss: 18.76392, Disc Loss: 1.86530, Mono Loss: 0.02307, S2S Loss: 2.87715, SLM Loss: 2.25671
|
25 |
+
INFO:2025-04-19 06:18:50,529: Epoch [174/2000], Step [50/103], Mel Loss: 0.50979, Gen Loss: 20.16633, Disc Loss: 1.63595, Mono Loss: 0.02933, S2S Loss: 2.76850, SLM Loss: 2.20160
|
26 |
+
INFO:2025-04-19 06:19:21,746: Epoch [174/2000], Step [60/103], Mel Loss: 0.49076, Gen Loss: 21.23984, Disc Loss: 1.59732, Mono Loss: 0.02372, S2S Loss: 2.90743, SLM Loss: 2.26471
|
27 |
+
INFO:2025-04-19 06:19:52,417: Epoch [174/2000], Step [70/103], Mel Loss: 0.48607, Gen Loss: 20.12070, Disc Loss: 1.82636, Mono Loss: 0.02717, S2S Loss: 2.90649, SLM Loss: 2.30423
|
28 |
+
INFO:2025-04-19 06:20:23,276: Epoch [174/2000], Step [80/103], Mel Loss: 0.47872, Gen Loss: 18.12522, Disc Loss: 2.01864, Mono Loss: 0.04236, S2S Loss: 2.67879, SLM Loss: 2.22928
|
29 |
+
INFO:2025-04-19 06:20:52,625: Epoch [174/2000], Step [90/103], Mel Loss: 0.47791, Gen Loss: 19.27369, Disc Loss: 1.76845, Mono Loss: 0.02332, S2S Loss: 3.05484, SLM Loss: 2.30379
|
30 |
+
INFO:2025-04-19 06:21:23,516: Epoch [174/2000], Step [100/103], Mel Loss: 0.48185, Gen Loss: 19.48250, Disc Loss: 1.91460, Mono Loss: 0.03009, S2S Loss: 2.77278, SLM Loss: 2.27458
|
31 |
+
INFO:2025-04-19 06:22:11,388: Epoch [175/2000], Step [10/103], Mel Loss: 0.47567, Gen Loss: 17.67046, Disc Loss: 2.03858, Mono Loss: 0.01649, S2S Loss: 2.63230, SLM Loss: 2.30893
|
32 |
+
INFO:2025-04-19 06:22:40,567: Epoch [175/2000], Step [20/103], Mel Loss: 0.47005, Gen Loss: 20.80192, Disc Loss: 1.59534, Mono Loss: 0.02183, S2S Loss: 2.78372, SLM Loss: 2.25107
|
33 |
+
INFO:2025-04-19 06:23:11,917: Epoch [175/2000], Step [30/103], Mel Loss: 0.50285, Gen Loss: 18.19817, Disc Loss: 2.01388, Mono Loss: 0.02578, S2S Loss: 2.60506, SLM Loss: 2.26861
|
34 |
+
INFO:2025-04-19 06:23:43,133: Epoch [175/2000], Step [40/103], Mel Loss: 0.49708, Gen Loss: 19.73482, Disc Loss: 1.70221, Mono Loss: 0.02521, S2S Loss: 2.68974, SLM Loss: 2.34267
|
35 |
+
INFO:2025-04-19 06:24:15,796: Epoch [175/2000], Step [50/103], Mel Loss: 0.49577, Gen Loss: 16.78472, Disc Loss: 2.31061, Mono Loss: 0.01824, S2S Loss: 2.42907, SLM Loss: 2.10514
|
36 |
+
INFO:2025-04-19 06:24:45,215: Epoch [175/2000], Step [60/103], Mel Loss: 0.49325, Gen Loss: 16.72832, Disc Loss: 2.22673, Mono Loss: 0.01935, S2S Loss: 2.05736, SLM Loss: 2.24337
|
37 |
+
INFO:2025-04-19 06:25:17,381: Epoch [175/2000], Step [70/103], Mel Loss: 0.50182, Gen Loss: 20.08214, Disc Loss: 1.75990, Mono Loss: 0.02761, S2S Loss: 2.43929, SLM Loss: 2.16661
|
38 |
+
INFO:2025-04-19 06:25:50,573: Epoch [175/2000], Step [80/103], Mel Loss: 0.49850, Gen Loss: 16.85787, Disc Loss: 2.16622, Mono Loss: 0.01707, S2S Loss: 2.29181, SLM Loss: 2.11115
|
39 |
+
INFO:2025-04-19 06:26:21,499: Epoch [175/2000], Step [90/103], Mel Loss: 0.49080, Gen Loss: 16.81436, Disc Loss: 2.10099, Mono Loss: 0.01821, S2S Loss: 2.57103, SLM Loss: 2.33462
|
40 |
+
INFO:2025-04-19 06:26:49,755: Epoch [175/2000], Step [100/103], Mel Loss: 0.46375, Gen Loss: 20.21952, Disc Loss: 1.58607, Mono Loss: 0.02129, S2S Loss: 2.59301, SLM Loss: 2.31743
|
41 |
+
INFO:2025-04-19 06:27:55,438: Epoch [176/2000], Step [10/103], Mel Loss: 0.49432, Gen Loss: 20.54411, Disc Loss: 1.63887, Mono Loss: 0.03046, S2S Loss: 2.25931, SLM Loss: 2.28496
|
42 |
+
INFO:2025-04-19 06:28:26,357: Epoch [176/2000], Step [20/103], Mel Loss: 0.47363, Gen Loss: 20.38404, Disc Loss: 1.77792, Mono Loss: 0.01983, S2S Loss: 2.60933, SLM Loss: 2.15457
|
43 |
+
INFO:2025-04-19 06:28:58,309: Epoch [176/2000], Step [30/103], Mel Loss: 0.49916, Gen Loss: 21.28178, Disc Loss: 1.47651, Mono Loss: 0.02568, S2S Loss: 2.65421, SLM Loss: 2.37266
|
44 |
+
INFO:2025-04-19 06:29:30,100: Epoch [176/2000], Step [40/103], Mel Loss: 0.50341, Gen Loss: 20.84227, Disc Loss: 1.53226, Mono Loss: 0.02120, S2S Loss: 2.51422, SLM Loss: 2.33485
|
45 |
+
INFO:2025-04-19 06:29:59,951: Epoch [176/2000], Step [50/103], Mel Loss: 0.50593, Gen Loss: 20.08417, Disc Loss: 1.64240, Mono Loss: 0.02494, S2S Loss: 2.45440, SLM Loss: 2.25015
|
46 |
+
INFO:2025-04-19 06:30:29,061: Epoch [176/2000], Step [60/103], Mel Loss: 0.49170, Gen Loss: 18.65475, Disc Loss: 1.99479, Mono Loss: 0.01651, S2S Loss: 2.47974, SLM Loss: 2.20827
|
47 |
+
INFO:2025-04-19 06:31:00,141: Epoch [176/2000], Step [70/103], Mel Loss: 0.52671, Gen Loss: 20.53784, Disc Loss: 1.50106, Mono Loss: 0.02845, S2S Loss: 2.69853, SLM Loss: 2.40133
|
48 |
+
INFO:2025-04-19 06:31:31,831: Epoch [176/2000], Step [80/103], Mel Loss: 0.49103, Gen Loss: 21.17548, Disc Loss: 1.57856, Mono Loss: 0.02808, S2S Loss: 2.29848, SLM Loss: 2.23754
|
49 |
+
INFO:2025-04-19 06:32:02,404: Epoch [176/2000], Step [90/103], Mel Loss: 0.48229, Gen Loss: 18.35145, Disc Loss: 1.93141, Mono Loss: 0.02003, S2S Loss: 2.13283, SLM Loss: 2.07911
|
50 |
+
INFO:2025-04-19 06:32:33,013: Epoch [176/2000], Step [100/103], Mel Loss: 0.47932, Gen Loss: 20.15468, Disc Loss: 1.82538, Mono Loss: 0.01628, S2S Loss: 2.84041, SLM Loss: 2.27381
|
51 |
+
INFO:2025-04-19 06:33:24,254: Epoch [177/2000], Step [10/103], Mel Loss: 0.50474, Gen Loss: 17.11293, Disc Loss: 2.16517, Mono Loss: 0.05381, S2S Loss: 2.09416, SLM Loss: 2.17665
|
52 |
+
INFO:2025-04-19 06:33:54,341: Epoch [177/2000], Step [20/103], Mel Loss: 0.47097, Gen Loss: 21.43686, Disc Loss: 1.55619, Mono Loss: 0.04970, S2S Loss: 2.45769, SLM Loss: 2.14187
|
53 |
+
INFO:2025-04-19 06:34:23,545: Epoch [177/2000], Step [30/103], Mel Loss: 0.46777, Gen Loss: 19.08918, Disc Loss: 1.86984, Mono Loss: 0.01860, S2S Loss: 2.19957, SLM Loss: 2.25150
|
54 |
+
INFO:2025-04-19 06:34:54,276: Epoch [177/2000], Step [40/103], Mel Loss: 0.46588, Gen Loss: 21.29658, Disc Loss: 1.57501, Mono Loss: 0.02686, S2S Loss: 2.71563, SLM Loss: 2.54344
|
55 |
+
INFO:2025-04-19 06:35:25,575: Epoch [177/2000], Step [50/103], Mel Loss: 0.48175, Gen Loss: 17.02888, Disc Loss: 2.12718, Mono Loss: 0.01955, S2S Loss: 2.48846, SLM Loss: 2.29242
|
56 |
+
INFO:2025-04-19 06:35:56,355: Epoch [177/2000], Step [60/103], Mel Loss: 0.49381, Gen Loss: 16.36454, Disc Loss: 2.32740, Mono Loss: 0.01739, S2S Loss: 1.99311, SLM Loss: 2.10335
|
57 |
+
INFO:2025-04-19 06:36:28,222: Epoch [177/2000], Step [70/103], Mel Loss: 0.48940, Gen Loss: 20.71991, Disc Loss: 1.51545, Mono Loss: 0.02215, S2S Loss: 2.12421, SLM Loss: 2.18526
|
58 |
+
INFO:2025-04-19 06:37:01,570: Epoch [177/2000], Step [80/103], Mel Loss: 0.48710, Gen Loss: 20.32706, Disc Loss: 1.61254, Mono Loss: 0.02250, S2S Loss: 2.32215, SLM Loss: 2.25215
|
59 |
+
INFO:2025-04-19 06:37:31,603: Epoch [177/2000], Step [90/103], Mel Loss: 0.49960, Gen Loss: 20.98949, Disc Loss: 1.57459, Mono Loss: 0.02182, S2S Loss: 2.19218, SLM Loss: 2.18602
|
60 |
+
INFO:2025-04-19 06:38:02,066: Epoch [177/2000], Step [100/103], Mel Loss: 0.51424, Gen Loss: 16.88578, Disc Loss: 2.06005, Mono Loss: 0.07569, S2S Loss: 1.97613, SLM Loss: 2.14808
|
61 |
+
INFO:2025-04-19 06:39:12,536: Epoch [178/2000], Step [10/103], Mel Loss: 0.51100, Gen Loss: 20.04249, Disc Loss: 1.70662, Mono Loss: 0.02108, S2S Loss: 2.29320, SLM Loss: 2.22905
|
62 |
+
INFO:2025-04-19 06:39:42,911: Epoch [178/2000], Step [20/103], Mel Loss: 0.50186, Gen Loss: 19.56831, Disc Loss: 2.05372, Mono Loss: 0.01500, S2S Loss: 2.36730, SLM Loss: 2.22509
|
63 |
+
INFO:2025-04-19 06:40:13,082: Epoch [178/2000], Step [30/103], Mel Loss: 0.47079, Gen Loss: 19.21834, Disc Loss: 1.84797, Mono Loss: 0.01643, S2S Loss: 2.42372, SLM Loss: 2.38288
|
64 |
+
INFO:2025-04-19 06:40:40,972: Epoch [178/2000], Step [40/103], Mel Loss: 0.47144, Gen Loss: 17.98199, Disc Loss: 1.87680, Mono Loss: 0.05998, S2S Loss: 1.97469, SLM Loss: 2.31611
|
65 |
+
INFO:2025-04-19 06:41:12,789: Epoch [178/2000], Step [50/103], Mel Loss: 0.49665, Gen Loss: 19.83783, Disc Loss: 1.60737, Mono Loss: 0.01816, S2S Loss: 1.94056, SLM Loss: 2.37035
|
66 |
+
INFO:2025-04-19 06:41:42,558: Epoch [178/2000], Step [60/103], Mel Loss: 0.47993, Gen Loss: 20.99589, Disc Loss: 1.58060, Mono Loss: 0.01886, S2S Loss: 2.00411, SLM Loss: 2.26554
|
67 |
+
INFO:2025-04-19 06:42:14,046: Epoch [178/2000], Step [70/103], Mel Loss: 0.49653, Gen Loss: 20.75497, Disc Loss: 1.51111, Mono Loss: 0.01569, S2S Loss: 2.09578, SLM Loss: 2.23805
|
68 |
+
INFO:2025-04-19 06:42:44,690: Epoch [178/2000], Step [80/103], Mel Loss: 0.49554, Gen Loss: 20.41372, Disc Loss: 1.63891, Mono Loss: 0.02980, S2S Loss: 2.14003, SLM Loss: 2.25515
|
69 |
+
INFO:2025-04-19 06:43:13,618: Epoch [178/2000], Step [90/103], Mel Loss: 0.46177, Gen Loss: 17.74081, Disc Loss: 2.06814, Mono Loss: 0.01958, S2S Loss: 2.33267, SLM Loss: 2.25924
|
70 |
+
INFO:2025-04-19 06:43:44,829: Epoch [178/2000], Step [100/103], Mel Loss: 0.47063, Gen Loss: 19.16476, Disc Loss: 1.95167, Mono Loss: 0.01380, S2S Loss: 2.27418, SLM Loss: 2.16315
|
71 |
+
INFO:2025-04-19 06:44:42,383: Epoch [179/2000], Step [10/103], Mel Loss: 0.48133, Gen Loss: 19.65171, Disc Loss: 1.81837, Mono Loss: 0.01611, S2S Loss: 2.02007, SLM Loss: 2.15730
|
72 |
+
INFO:2025-04-19 06:45:14,826: Epoch [179/2000], Step [20/103], Mel Loss: 0.49343, Gen Loss: 17.33815, Disc Loss: 2.47997, Mono Loss: 0.01305, S2S Loss: 2.07549, SLM Loss: 2.13905
|
73 |
+
INFO:2025-04-19 06:45:45,968: Epoch [179/2000], Step [30/103], Mel Loss: 0.50345, Gen Loss: 19.96809, Disc Loss: 1.86567, Mono Loss: 0.02316, S2S Loss: 2.35168, SLM Loss: 2.21718
|
74 |
+
INFO:2025-04-19 06:46:16,478: Epoch [179/2000], Step [40/103], Mel Loss: 0.51349, Gen Loss: 17.72800, Disc Loss: 2.10020, Mono Loss: 0.01258, S2S Loss: 2.22015, SLM Loss: 2.27779
|
75 |
+
INFO:2025-04-19 06:46:47,978: Epoch [179/2000], Step [50/103], Mel Loss: 0.47499, Gen Loss: 20.26324, Disc Loss: 1.65529, Mono Loss: 0.01757, S2S Loss: 2.14208, SLM Loss: 2.20641
|
76 |
+
INFO:2025-04-19 06:47:17,940: Epoch [179/2000], Step [60/103], Mel Loss: 0.47963, Gen Loss: 18.71129, Disc Loss: 1.98715, Mono Loss: 0.02216, S2S Loss: 2.06452, SLM Loss: 2.44723
|
77 |
+
INFO:2025-04-19 06:47:46,672: Epoch [179/2000], Step [70/103], Mel Loss: 0.46955, Gen Loss: 16.24311, Disc Loss: 2.33695, Mono Loss: 0.04459, S2S Loss: 2.26657, SLM Loss: 2.20270
|
78 |
+
INFO:2025-04-19 06:48:19,554: Epoch [179/2000], Step [80/103], Mel Loss: 0.49098, Gen Loss: 16.58536, Disc Loss: 2.10204, Mono Loss: 0.01451, S2S Loss: 2.36178, SLM Loss: 2.20389
|
79 |
+
INFO:2025-04-19 06:48:49,801: Epoch [179/2000], Step [90/103], Mel Loss: 0.48200, Gen Loss: 19.20991, Disc Loss: 1.70413, Mono Loss: 0.01811, S2S Loss: 2.04987, SLM Loss: 2.27541
|
80 |
+
INFO:2025-04-19 06:49:19,884: Epoch [179/2000], Step [100/103], Mel Loss: 0.48396, Gen Loss: 19.84217, Disc Loss: 1.62315, Mono Loss: 0.02771, S2S Loss: 1.89488, SLM Loss: 2.24688
|
81 |
+
INFO:2025-04-19 06:50:31,289: Epoch [180/2000], Step [10/103], Mel Loss: 0.48818, Gen Loss: 20.37338, Disc Loss: 1.65358, Mono Loss: 0.02379, S2S Loss: 2.01214, SLM Loss: 2.28381
|
82 |
+
INFO:2025-04-19 06:51:02,619: Epoch [180/2000], Step [20/103], Mel Loss: 0.47724, Gen Loss: 20.96991, Disc Loss: 1.54709, Mono Loss: 0.02196, S2S Loss: 1.85579, SLM Loss: 2.19455
|
83 |
+
INFO:2025-04-19 06:51:30,808: Epoch [180/2000], Step [30/103], Mel Loss: 0.47380, Gen Loss: 16.36775, Disc Loss: 2.27467, Mono Loss: 0.09785, S2S Loss: 2.17829, SLM Loss: 2.02525
|
84 |
+
INFO:2025-04-19 06:52:01,719: Epoch [180/2000], Step [40/103], Mel Loss: 0.50057, Gen Loss: 20.71078, Disc Loss: 1.53290, Mono Loss: 0.01963, S2S Loss: 2.49991, SLM Loss: 2.38910
|
85 |
+
INFO:2025-04-19 06:52:33,851: Epoch [180/2000], Step [50/103], Mel Loss: 0.49654, Gen Loss: 19.57065, Disc Loss: 1.76384, Mono Loss: 0.02505, S2S Loss: 2.27472, SLM Loss: 2.14535
|
86 |
+
INFO:2025-04-19 06:53:07,125: Epoch [180/2000], Step [60/103], Mel Loss: 0.49525, Gen Loss: 19.67667, Disc Loss: 1.78827, Mono Loss: 0.02732, S2S Loss: 2.31969, SLM Loss: 2.15537
|
87 |
+
INFO:2025-04-19 06:53:37,750: Epoch [180/2000], Step [70/103], Mel Loss: 0.45083, Gen Loss: 20.67027, Disc Loss: 1.61505, Mono Loss: 0.01881, S2S Loss: 1.93325, SLM Loss: 2.12408
|
88 |
+
INFO:2025-04-19 06:54:08,298: Epoch [180/2000], Step [80/103], Mel Loss: 0.48052, Gen Loss: 19.88732, Disc Loss: 1.58013, Mono Loss: 0.03172, S2S Loss: 1.95051, SLM Loss: 2.24723
|
89 |
+
INFO:2025-04-19 06:54:39,525: Epoch [180/2000], Step [90/103], Mel Loss: 0.48107, Gen Loss: 19.58432, Disc Loss: 1.81857, Mono Loss: 0.01407, S2S Loss: 2.00401, SLM Loss: 2.01524
|
90 |
+
INFO:2025-04-19 06:55:09,864: Epoch [180/2000], Step [100/103], Mel Loss: 0.48382, Gen Loss: 21.15065, Disc Loss: 1.59409, Mono Loss: 0.02166, S2S Loss: 1.97609, SLM Loss: 2.34446
|