Spaces:
Paused
Paused
'''
Defines the set of symbols used in text input to the model.

Each supported cleaner has its own symbol table in ``_SYMBOL_SETS``.
Exactly one table is active at a time, selected by ``_ACTIVE_CLEANER``;
the module-level ``symbols`` list and ``SPACE_ID`` are built from it.
'''

# Symbol tables keyed by cleaner name. Each value is a
# (pad, punctuation, letters) triple.
#
# Character order inside each string is significant: a symbol's index in
# ``symbols`` is derived from its position here, so never reorder, insert
# into, or deduplicate these strings casually.
_SYMBOL_SETS = {
    'japanese_cleaners': (
        '_',
        ',.!?-',
        'AEINOQUabdefghijkmnoprstuvwyzʃʧ↓↑ ',
    ),
    'japanese_cleaners2': (
        '_',
        ',.!?-~…',
        'AEINOQUabdefghijkmnoprstuvwyzʃʧʦ↓↑ ',
    ),
    'korean_cleaners': (
        '_',
        ',.!?…~',
        'ㄱㄴㄷㄹㅁㅂㅅㅇㅈㅊㅋㅌㅍㅎㄲㄸㅃㅆㅉㅏㅓㅗㅜㅡㅣㅐㅔ ',
    ),
    'chinese_cleaners': (
        '_',
        ',。!?—…',
        'ㄅㄆㄇㄈㄉㄊㄋㄌㄍㄎㄏㄐㄑㄒㄓㄔㄕㄖㄗㄘㄙㄚㄛㄜㄝㄞㄟㄠㄡㄢㄣㄤㄥㄦㄧㄨㄩˉˊˇˋ˙ ',
    ),
    'zh_ja_mixture_cleaners': (
        '_',
        ',.!?-~…',
        'AEINOQUabdefghijklmnoprstuvwyzʃʧʦɯɹəɥ⁼ʰ`→↓↑ ',
    ),
    'sanskrit_cleaners': (
        '_',
        '।',
        'ँंःअआइईउऊऋएऐओऔकखगघङचछजझञटठडढणतथदधनपफबभमयरलळवशषसहऽािीुूृॄेैोौ्ॠॢ ',
    ),
    'cjks_cleaners': (
        '_',
        ',.!?-~…',
        'NQabdefghijklmnopstuvwxyzʃʧʥʦɯɹəɥçɸɾβŋɦː⁼ʰ`^#*=→↓↑ ',
    ),
    # NOTE: for this table the space character lives in the punctuation
    # string rather than in the letters string.
    'thai_cleaners': (
        '_',
        '.!? ',
        'กขฃคฆงจฉชซฌญฎฏฐฑฒณดตถทธนบปผฝพฟภมยรฤลวศษสหฬอฮฯะัาำิีึืุูเแโใไๅๆ็่้๊๋์',
    ),
    'cjke_cleaners2': (
        '_',
        ',.!?-~…',
        'NQabdefghijklmnopstuvwxyzɑæʃʑçɯɪɔɛɹðəɫɥɸʊɾʒθβŋɦ⁼ʰ`^#*=ˈˌ→↓↑ ',
    ),
    'shanghainese_cleaners': (
        '_',
        ',.!?…',
        'abdfghiklmnopstuvyzøŋȵɑɔɕəɤɦɪɿʑʔʰ̩̃ᴀᴇ15678 ',
    ),
    'chinese_dialect_cleaners': (
        '_',
        ',.!?~…─',
        '#Nabdefghijklmnoprstuvwxyzæçøŋœȵɐɑɒɓɔɕɗɘəɚɛɜɣɤɦɪɭɯɵɷɸɻɾɿʂʅʊʋʌʏʑʔʦʮʰʷˀː˥˦˧˨˩̥̩̃̚αᴀᴇ↑↓∅ⱼ ',
    ),
}

# Name of the table exported below. To switch cleaners, change this single
# value instead of moving string delimiters around the tables.
_ACTIVE_CLEANER = 'japanese_cleaners2'

# Raises KeyError at import time if the selected name has no table.
_pad, _punctuation, _letters = _SYMBOL_SETS[_ACTIVE_CLEANER]

# Export all symbols: pad first, then punctuation, then letters.
symbols = [_pad] + list(_punctuation) + list(_letters)

# Special symbol ids
# Index of the first space in ``symbols``; raises ValueError if the active
# table contains no space character.
SPACE_ID = symbols.index(" ")