File size: 2,901 Bytes
7c16a3b
 
 
 
 
 
 
 
 
 
6e5a1f8
7c16a3b
4960bfb
7c16a3b
 
 
 
 
 
 
 
 
 
7ceb3b6
7c16a3b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4c8411c
7c16a3b
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
import gradio as gr

import os

from gradio_client import Client

from dotenv import load_dotenv
# Load variables from a local .env file (when one exists) before reading the token.
load_dotenv()

# Hugging Face access token; a KeyError is raised right here if "hf_token" is not set.
HF_TOKEN = os.environ["hf_token"]

# Client for the hosted Space that performs the actual speech synthesis.
client = Client(
    "Ghana-NLP/Northern-Ghana-TTS",
    hf_token=HF_TOKEN,
)

def synthesize(text, lang, speaker):
    """Synthesize speech for ``text`` by calling the remote TTS Space.

    Args:
        text: The text to be spoken.
        lang: Language name, forwarded unchanged to the remote endpoint.
        speaker: Speaker/voice name, forwarded unchanged to the remote endpoint.

    Returns:
        Whatever the Space's ``/predict`` endpoint returns, passed through
        unmodified.
    """
    # All work happens remotely; this function is a thin pass-through.
    return client.predict(
        text=text,
        lang=lang,
        speaker=speaker,
        api_name="/predict",
    )


# Heading text handed to the interface as its title.
title = "Khaya AI: Speech Synthesis for Northern Ghanaian Languages"

# Short usage hint handed to the interface as its description (contains inline HTML).
description = (
    "\n"
    "<b>How to use:</b> Enter some text and choose a language and speaker.\n"
)

# Sample inputs passed to the interface as `examples`. Each row is
# [text, language, speaker], in the same order as the interface's inputs.
examples = [
    ["Nɛ malaika na kaŋɛ bumo: “Men sa maa lɔ kufu, ŋkpal manɛ so, baru lela nɛ k beeŋ sa basa kikɛ kagbenefuli nɛ m bar menyi.", "Gonja","Female"],
    ["Kumo to be ndibi be ayabi bee wɔl nna a buri a tɔr nɛ beche bee kil amo a puga edɛ. Ŋkpal basa na ka maŋ pin asheŋ to na so, Ebɔrɛ nɛ e to bumo na maaŋ wu bumo kuwɔr ŋko n shu bumo so.", "Gonja","Male (Low)"],
    ["Di saha ka niriba anaasi daa zi gbariga m-paai na.", "Mampruli","Female"],
    ["Ka Yisa daa nya ka u ma n zɛya, ŋↄn ni u nyaandↄlisↄ ŋↄn daa wuri pam la gba. Ka u yɛli u ma maa, ni, <<Nyama, m ma, i bii nŋↄa.>>", "Mampruli","Male (Low)"],
    ["Abena mɔ mɛ. A dugԑ la dinu’uma bɔ ma dee le pee dugerɔ la laasi la amiŋa.", "Gurene","Female"],
    ["Budaa la zԑ̃kԑ bugundɔɔ la paԑ la ka gbe’ere beene dee dĩ’ԑ ŋmi’a zi’an la.", "Gurene","Male (Low)"],
    ["Dagbamba nyɛla zuliya ban be tudu yaɣili. Dagbamba ni yɛri bal'shɛli n nyɛ dagbanli.", "Dagbani","Female"],
    ["Ka o daa bahi kpi lala Ashibiti titali maa ni silimiin-gɔli November biɛɣ' pia ni ayɔbu dali.", "Dagbani","Male (Low)"],
    ["Bana la ka ba maŋ wullo tegitegilɛ kyɛ ka ba daŋ ba baŋ a yelmeŋɛ.", "Dagaare","Female"],
    ["O da yeli ko la a banaŋ naŋ da koɔrɔ a ŋmama, “Yɛ de a boma ŋa yi te bare! Yɛ ta de a N Saa yiri ka o leɛ yɛ daa diibu zie!”", "Dagaare","Male (Low)"],
    ["Ka bo ka m na niŋ yʋ'ʋse? M na pʋ'ʋs nɛ m siig ka me lem pʋ'ʋs nɛ m ya'am, ka yum nɛ m siig ka mɛ lɛn yum nɛ m ya'am.", "Kusaal", "Female"],
    ["Ban daa nyɛ nwadibil la, ka ba sʋnya ma'ae. Ka ba maal sumalisim bɛdegʋ.", "Kusaal", "Male (Low)"],
    ["And this model speaks English in a West African accent too, if you can believe that.", "English","Female"],
]

# Input widgets, listed in the positional order of synthesize(text, lang, speaker).
text_input = gr.Text(label="Input Text")
language_input = gr.Dropdown(
    label="Select Language",
    choices=["Dagaare", "Dagbani", "Gonja", "Gurene", "Kusaal", "Mampruli", "English"],
    value="Dagbani",
)
speaker_input = gr.Radio(
    label="Speaker",
    choices=["Female", "Male (Low)", "Male (High)"],
    value="Female",
)

# Single audio component that receives whatever synthesize() returns.
speech_output = gr.Audio(label="Generated Speech", type="numpy")

# Assemble the UI and start serving it as soon as the script runs.
demo = gr.Interface(
    fn=synthesize,
    inputs=[text_input, language_input, speaker_input],
    outputs=[speech_output],
    title=title,
    description=description,
    examples=examples,
)
demo.launch()