'''
Defines the set of symbols used in text input to the model.

Exactly one symbol set (``_pad`` / ``_punctuation`` / ``_letters``) is active
at a time.  The alternative sets are kept below inside bare triple-quoted
strings, which Python evaluates and discards, so they have no runtime effect.
To switch sets, move the wanted assignments out of their string block and
disable the currently active ones.

Public names:
    symbols  -- list of single-character strings: the pad symbol first, then
                every punctuation character, then every letter.
    SPACE_ID -- index of the space character ' ' inside ``symbols``.
'''

'''# japanese_cleaners
_pad = '_'
_punctuation = ',.!?-'
_letters = 'AEINOQUabdefghijkmnoprstuvwyzʃʧ↓↑ '
'''

# Active symbol set.  It carries no label in this file; compared with the
# japanese_cleaners block above it adds '~' and '…' to the punctuation and
# 'ʦ' to the letters.
_pad = '_'
_punctuation = ',.!?-~…'
_letters = 'AEINOQUabdefghijkmnoprstuvwyzʃʧʦ↓↑ '

'''# korean_cleaners
_pad = '_'
_punctuation = ',.!?…~'
_letters = 'ㄱㄴㄷㄹㅁㅂㅅㅇㅈㅊㅋㅌㅍㅎㄲㄸㅃㅆㅉㅏㅓㅗㅜㅡㅣㅐㅔ '
'''

'''# chinese_cleaners
_pad = '_'
_punctuation = ',。!?—…'
_letters = 'ㄅㄆㄇㄈㄉㄊㄋㄌㄍㄎㄏㄐㄑㄒㄓㄔㄕㄖㄗㄘㄙㄚㄛㄜㄝㄞㄟㄠㄡㄢㄣㄤㄥㄦㄧㄨㄩˉˊˇˋ˙ '
'''

'''# zh_ja_mixture_cleaners
_pad = '_'
_punctuation = ',.!?-~…'
_letters = 'AEINOQUabdefghijklmnoprstuvwyzʃʧʦɯɹəɥ⁼ʰ`→↓↑ '
'''

'''# sanskrit_cleaners
_pad = '_'
_punctuation = '।'
_letters = 'ँंःअआइईउऊऋएऐओऔकखगघङचछजझञटठडढणतथदधनपफबभमयरलळवशषसहऽािीुूृॄेैोौ्ॠॢ '
'''

'''# cjks_cleaners
_pad = '_'
_punctuation = ',.!?-~…'
_letters = 'NQabdefghijklmnopstuvwxyzʃʧʥʦɯɹəɥçɸɾβŋɦː⁼ʰ`^#*=→↓↑ '
'''

'''# thai_cleaners
_pad = '_'
_punctuation = '.!? '
_letters = 'กขฃคฆงจฉชซฌญฎฏฐฑฒณดตถทธนบปผฝพฟภมยรฤลวศษสหฬอฮฯะัาำิีึืุูเแโใไๅๆ็่้๊๋์'
'''

'''# cjke_cleaners2
_pad = '_'
_punctuation = ',.!?-~…'
_letters = 'NQabdefghijklmnopstuvwxyzɑæʃʑçɯɪɔɛɹðəɫɥɸʊɾʒθβŋɦ⁼ʰ`^#*=ˈˌ→↓↑ '
'''

'''# shanghainese_cleaners
_pad = '_'
_punctuation = ',.!?…'
_letters = 'abdfghiklmnopstuvyzøŋȵɑɔɕəɤɦɪɿʑʔʰ̩̃ᴀᴇ15678 '
'''

'''# chinese_dialect_cleaners
_pad = '_'
_punctuation = ',.!?~…─'
_letters = '#Nabdefghijklmnoprstuvwxyzæçøŋœȵɐɑɒɓɔɕɗɘəɚɛɜɣɤɦɪɭɯɵɷɸɻɾɿʂʅʊʋʌʏʑʔʦʮʰʷˀː˥˦˧˨˩̥̩̃̚ᴀᴇ↑↓∅ⱼ '
'''

# Flat symbol table: index 0 is the pad symbol, followed by each punctuation
# character and then each letter, in the order they appear in the strings.
# list() splits per code point, so a combining mark becomes its own entry.
symbols = [_pad] + list(_punctuation) + list(_letters)

# Position of the space character in ``symbols``.  list.index raises
# ValueError if the active set contains no ' ' in either string.
SPACE_ID = symbols.index(" ")
|