# Pipe1213's picture
# Upload 2 files
# cd2d09a verified
# raw
# history blame
# 1.04 kB
""" from https://github.com/keithito/tacotron """
'''
Defines the set of symbols used in text input to the model.
'''
# ---------------------------------------------------------------------------
# Legacy symbol sets. They are kept commented out for reference only; nothing
# below reads them.
# ---------------------------------------------------------------------------
#_pad = '_'
#_numbers = '0123456789'
#_letters = 'ABCÇDEFGHIJKLMNOPQRSTUVWXYZÂÊÎÏÔÛâêîïôûéÉèåÅÈàÀüùÙÌìëöõabcçdefghijklmnopqrstuvwxyz'
#_letters_ipa = "&°ɑɐɒæɓʙβɔɕçɗɖðʤəɘɚɛɜɝɞɟʄɡɠɢʛɦɧħɥʜɨɪʝɭɬɫɮʟɱɯɰŋɳɲɴøɵɸθœɶʘɹɺɾɻʀʁɽʂʃʈʧʉʊʋⱱʌɣɤʍχʎʏʑʐʒʔʡʕʢǀǁǂǃˈˌːˑʼʴʰʱʲʷˠˤ˞↓↑→↗↘'̩'ᵻ"
#_letters_ipa_lisn = " !,./0123456789:?@ACDEILMNOPSUXYZ_abcdefghijklmnoprstuvwxyz|~"
# Former export formula:
#   [_pad] + list(_punctuation) + list(_letters) + list(_numbers) + list(_letters_ipa)

# The one entry that sits at the head of the symbol table (position 0).
_punctuation = '"'

# Every other entry, one per character, in table order.
# NOTE(review): "û" and the trailing "PRSTVWYZ" look like repeats of earlier
# characters. They are left untouched because an entry's id is its position
# in the list, so removing anything would shift ids and change the table
# length -- confirm against the consumers of `symbols` before cleaning up.
_full_alphabet = " !*&'()+,-./0123456789:;?ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz|«°»ÀÂÇÈÉÊÎÏÔÙÛàâæçèéêëîïôöùúûüœ–’“”…ÅåûPRSTVWYZ"

# Export all symbols: the quote character first, followed by each character
# of the alphabet string as its own list element.
symbols = [_punctuation]
symbols.extend(_full_alphabet)

# Special symbol ids
# Position of the first plain space character in the exported table.
SPACE_ID = symbols.index(" ")