|
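'''
Defines the set of symbols used in text input to the model.

Only one symbol set is active at a time: the sets for other cleaners are kept
as disabled triple-quoted blocks, and the un-quoted `_pad` / `_punctuation` /
`_letters` assignments are the ones used to build `symbols`.
'''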
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
'''# japanese_cleaners2
|
|
_pad = '_'
|
|
_punctuation = ',.!?-~…'
|
|
_letters = 'AEINOQUabdefghijkmnoprstuvwyzʃʧʦ↓↑ '
|
|
'''
|
|
|
|
|
|
'''# korean_cleaners
|
|
_pad = '_'
|
|
_punctuation = ',.!?…~'
|
|
_letters = 'ㄱㄴㄷㄹㅁㅂㅅㅇㅈㅊㅋㅌㅍㅎㄲㄸㅃㅆㅉㅏㅓㅗㅜㅡㅣㅐㅔ '
|
|
'''
|
|
|
|
'''# chinese_cleaners
|
|
_pad = '_'
|
|
_punctuation = ',。!?—…'
|
|
_letters = 'ㄅㄆㄇㄈㄉㄊㄋㄌㄍㄎㄏㄐㄑㄒㄓㄔㄕㄖㄗㄘㄙㄚㄛㄜㄝㄞㄟㄠㄡㄢㄣㄤㄥㄦㄧㄨㄩˉˊˇˋ˙ '
|
|
'''
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
'''# sanskrit_cleaners
|
|
_pad = '_'
|
|
_punctuation = '।'
|
|
_letters = 'ँंःअआइईउऊऋएऐओऔकखगघङचछजझञटठडढणतथदधनपफबभमयरलळवशषसहऽािीुूृॄेैोौ्ॠॢ '
|
|
'''
|
|
|
|
'''# cjks_cleaners
|
|
_pad = '_'
|
|
_punctuation = ',.!?-~…'
|
|
_letters = 'NQabdefghijklmnopstuvwxyzʃʧʥʦɯɹəɥçɸɾβŋɦː⁼ʰ`^#*=→↓↑ '
|
|
'''
|
|
|
|
'''# thai_cleaners
|
|
_pad = '_'
|
|
_punctuation = '.!? '
|
|
_letters = 'กขฃคฆงจฉชซฌญฎฏฐฑฒณดตถทธนบปผฝพฟภมยรฤลวศษสหฬอฮฯะัาำิีึืุูเแโใไๅๆ็่้๊๋์'
|
|
'''
|
|
|
|
|
|
# Active symbol set: these three un-quoted assignments are the ones that feed
# `symbols` below. The triple-quoted blocks around them are disabled
# alternatives for other cleaners.
# NOTE(review): this set carries no cleaner label in the file -- confirm which
# cleaner it is meant to pair with.
_pad = '_'
_punctuation = ',.!?-~…'
_letters = 'NQabdefghijklmnopstuvwxyzɑæʃʑçɯɪɔɛɹðəɫɥɸʊɾʒθβŋɦ⁼ʰ`^#*=ˈˌ→↓↑ '


'''# shanghainese_cleaners
_pad = '_'
_punctuation = ',.!?…'
_letters = 'abdfghiklmnopstuvyzøŋȵɑɔɕəɤɦɪɿʑʔʰ̩̃ᴀᴇ15678 '
'''


'''# chinese_dialect_cleaners
_pad = '_'
_punctuation = ',.!?~…─'
_letters = '#Nabdefghijklmnoprstuvwxyzæçøŋœȵɐɑɒɓɔɕɗɘəɚɛɜɣɤɦɪɭɯɵɷɸɻɾɿʂʅʊʋʌʏʑʔʦʮʰʷˀː˥˦˧˨˩̥̩̃̚ᴀᴇ↑↓∅ⱼ '
'''


# Full symbol table: the pad symbol first, then every punctuation character,
# then every letter, one list entry per character. Order matters, because
# SPACE_ID below is a position in this list.
symbols = [_pad, *_punctuation, *_letters]

# Position of the space character in `symbols`. `list.index` raises ValueError
# at import time if the active set contains no ' '.
SPACE_ID = symbols.index(" ")
|
|
|