Spaces:

tartuNLP
/

XTTSv2-est

Sleeping

Rasmus Lellep committed on Jul 10

Commit

4ea5559

1 Parent(s): 5a03f53

added more languages

Files changed (3) hide show

app.py CHANGED Viewed

@@ -61,7 +61,7 @@ demo = gr.Interface(
     title="XTTSv2-est Demo",
     description="To get the best results, provide a reference clip around the same length as the output sentence you want.",
     fn=predict,
-    inputs=["text", gr.Dropdown(["et", "en"]), gr.File()],
     outputs=[gr.Audio()],
 )

     title="XTTSv2-est Demo",
     description="To get the best results, provide a reference clip around the same length as the output sentence you want.",
     fn=predict,
+    inputs=["text", gr.Dropdown(["et", "en", "es", "fr", "de", "it", "pt", "pl", "tr", "ru", "nl", "cs", "ar", "zh-cn", "hu", "ko", "ja", "hi"]), gr.File()],
     outputs=[gr.Audio()],
 )

app_local.py CHANGED Viewed

@@ -47,7 +47,7 @@ demo = gr.Interface(
     title="XTTSv2-est Demo",
     description="To get the best results, provide a reference clip around the same length as the output sentence you want.",
     fn=predict,
-    inputs=["text", gr.Dropdown(["et", "en"]), gr.File()],
     outputs=[gr.Audio()],
 )

     title="XTTSv2-est Demo",
     description="To get the best results, provide a reference clip around the same length as the output sentence you want.",
     fn=predict,
+    inputs=["text", gr.Dropdown(["et", "en", "es", "fr", "de", "it", "pt", "pl", "tr", "ru", "nl", "cs", "ar", "zh-cn", "hu", "ko", "ja", "hi"]), gr.File()],
     outputs=[gr.Audio()],
 )

requirements.txt CHANGED Viewed

@@ -16,8 +16,16 @@ fsspec[http]>=2023.6.0
 aiohttp>=3.8.1
 packaging>=23.1
 ###mutagen==1.47.0
 # deps for inference
 pysbd>=0.3.4
 # coqui stack
 trainer>=0.0.36
 coqui-tts-trainer>=0.2.0,<0.3.0
@@ -26,14 +34,30 @@ coqpit-config>=0.1.1,<0.2.0
 monotonic-alignment-search>=0.1.0
 # gruut+supported langs
 gruut[de,es,fr]==2.4.0
 ###nltk
 g2pkk>=0.1.1
 pip>=22.2
 # deps for estonian
 tts_preprocess_et @ git+https://github.com/TartuNLP/[email protected]
 #deps for tortoise
 einops>=0.6.0
 transformers>=4.43.0,<=4.46.2
 # deps for XTTS
 ###unidecode>=1.3.2
 num2words>=0.5.14

 aiohttp>=3.8.1
 packaging>=23.1
 ###mutagen==1.47.0
+# deps for examples
+flask>=3.0.0
 # deps for inference
 pysbd>=0.3.4
+# deps for notebooks
+bokeh==1.4.0
+umap-learn>=0.5.1
+pandas>=1.4,<2.0
+# deps for training
+matplotlib>=3.7.0
 # coqui stack
 trainer>=0.0.36
 coqui-tts-trainer>=0.2.0,<0.3.0
 monotonic-alignment-search>=0.1.0
 # gruut+supported langs
 gruut[de,es,fr]==2.4.0
+# chinese g2p deps
+jieba>=0.42.1
+pypinyin>=0.40.0
+# deps for korean
+hangul_romanize>=0.1.0
+jamo>=0.4.1
 ###nltk
 g2pkk>=0.1.1
 pip>=22.2
+# deps for bangla
+bangla>=0.0.2
+bnnumerizer>=0.0.2
+bnunicodenormalizer>=0.1.0
+# deps for japanese
+mecab-python3>=1.0.2
+unidic-lite==1.0.8
+cutlet>=0.2.0
 # deps for estonian
 tts_preprocess_et @ git+https://github.com/TartuNLP/[email protected]
 #deps for tortoise
 einops>=0.6.0
 transformers>=4.43.0,<=4.46.2
+#deps for bark
+encodec>=0.1.1
 # deps for XTTS
 ###unidecode>=1.3.2
 num2words>=0.5.14