Spaces:
Sleeping
Sleeping
Rasmus Lellep
committed on
Commit
·
4ea5559
1
Parent(s):
5a03f53
added more languages
Browse files
- app.py +1 -1
- app_local.py +1 -1
- requirements.txt +24 -0
app.py
CHANGED
@@ -61,7 +61,7 @@ demo = gr.Interface(
|
|
61 |
title="XTTSv2-est Demo",
|
62 |
description="To get the best results, provide a reference clip around the same length as the output sentence you want.",
|
63 |
fn=predict,
|
64 |
-
inputs=["text", gr.Dropdown(["et", "en"]), gr.File()],
|
65 |
outputs=[gr.Audio()],
|
66 |
)
|
67 |
|
|
|
61 |
title="XTTSv2-est Demo",
|
62 |
description="To get the best results, provide a reference clip around the same length as the output sentence you want.",
|
63 |
fn=predict,
|
64 |
+
inputs=["text", gr.Dropdown(["et", "en", "es", "fr", "de", "it", "pt", "pl", "tr", "ru", "nl", "cs", "ar", "zh-cn", "hu", "ko", "ja", "hi"]), gr.File()],
|
65 |
outputs=[gr.Audio()],
|
66 |
)
|
67 |
|
app_local.py
CHANGED
@@ -47,7 +47,7 @@ demo = gr.Interface(
|
|
47 |
title="XTTSv2-est Demo",
|
48 |
description="To get the best results, provide a reference clip around the same length as the output sentence you want.",
|
49 |
fn=predict,
|
50 |
-
inputs=["text", gr.Dropdown(["et", "en"]), gr.File()],
|
51 |
outputs=[gr.Audio()],
|
52 |
)
|
53 |
|
|
|
47 |
title="XTTSv2-est Demo",
|
48 |
description="To get the best results, provide a reference clip around the same length as the output sentence you want.",
|
49 |
fn=predict,
|
50 |
+
inputs=["text", gr.Dropdown(["et", "en", "es", "fr", "de", "it", "pt", "pl", "tr", "ru", "nl", "cs", "ar", "zh-cn", "hu", "ko", "ja", "hi"]), gr.File()],
|
51 |
outputs=[gr.Audio()],
|
52 |
)
|
53 |
|
requirements.txt
CHANGED
@@ -16,8 +16,16 @@ fsspec[http]>=2023.6.0
|
|
16 |
aiohttp>=3.8.1
|
17 |
packaging>=23.1
|
18 |
###mutagen==1.47.0
|
|
|
|
|
19 |
# deps for inference
|
20 |
pysbd>=0.3.4
|
|
|
|
|
|
|
|
|
|
|
|
|
21 |
# coqui stack
|
22 |
trainer>=0.0.36
|
23 |
coqui-tts-trainer>=0.2.0,<0.3.0
|
@@ -26,14 +34,30 @@ coqpit-config>=0.1.1,<0.2.0
|
|
26 |
monotonic-alignment-search>=0.1.0
|
27 |
# gruut+supported langs
|
28 |
gruut[de,es,fr]==2.4.0
|
|
|
|
|
|
|
|
|
|
|
|
|
29 |
###nltk
|
30 |
g2pkk>=0.1.1
|
31 |
pip>=22.2
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
32 |
# deps for estonian
|
33 |
tts_preprocess_et @ git+https://github.com/TartuNLP/[email protected]
|
34 |
#deps for tortoise
|
35 |
einops>=0.6.0
|
36 |
transformers>=4.43.0,<=4.46.2
|
|
|
|
|
37 |
# deps for XTTS
|
38 |
###unidecode>=1.3.2
|
39 |
num2words>=0.5.14
|
|
|
16 |
aiohttp>=3.8.1
|
17 |
packaging>=23.1
|
18 |
###mutagen==1.47.0
|
19 |
+
# deps for examples
|
20 |
+
flask>=3.0.0
|
21 |
# deps for inference
|
22 |
pysbd>=0.3.4
|
23 |
+
# deps for notebooks
|
24 |
+
bokeh==1.4.0
|
25 |
+
umap-learn>=0.5.1
|
26 |
+
pandas>=1.4,<2.0
|
27 |
+
# deps for training
|
28 |
+
matplotlib>=3.7.0
|
29 |
# coqui stack
|
30 |
trainer>=0.0.36
|
31 |
coqui-tts-trainer>=0.2.0,<0.3.0
|
|
|
34 |
monotonic-alignment-search>=0.1.0
|
35 |
# gruut+supported langs
|
36 |
gruut[de,es,fr]==2.4.0
|
37 |
+
# chinese g2p deps
|
38 |
+
jieba>=0.42.1
|
39 |
+
pypinyin>=0.40.0
|
40 |
+
# deps for korean
|
41 |
+
hangul_romanize>=0.1.0
|
42 |
+
jamo>=0.4.1
|
43 |
###nltk
|
44 |
g2pkk>=0.1.1
|
45 |
pip>=22.2
|
46 |
+
# deps for bangla
|
47 |
+
bangla>=0.0.2
|
48 |
+
bnnumerizer>=0.0.2
|
49 |
+
bnunicodenormalizer>=0.1.0
|
50 |
+
# deps for japanese
|
51 |
+
mecab-python3>=1.0.2
|
52 |
+
unidic-lite==1.0.8
|
53 |
+
cutlet>=0.2.0
|
54 |
# deps for estonian
|
55 |
tts_preprocess_et @ git+https://github.com/TartuNLP/[email protected]
|
56 |
#deps for tortoise
|
57 |
einops>=0.6.0
|
58 |
transformers>=4.43.0,<=4.46.2
|
59 |
+
#deps for bark
|
60 |
+
encodec>=0.1.1
|
61 |
# deps for XTTS
|
62 |
###unidecode>=1.3.2
|
63 |
num2words>=0.5.14
|