File size: 1,035 Bytes
cd2d09a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
""" from https://github.com/keithito/tacotron """

'''
Defines the set of symbols used in text input to the model.
'''
#_pad        = '_'
# Active symbol sources: a single punctuation entry plus one flat alphabet string.
_punctuation = '"'
_full_alphabet = " !*&'()+,-./0123456789:;?ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz|«°»ÀÂÇÈÉÊÎÏÔÙÛàâæçèéêëîïôöùúûüœ–’“”…ÅåûPRSTVWYZ"

# Alternative symbol sets, currently disabled:
#_numbers = '0123456789'
#_letters = 'ABCÇDEFGHIJKLMNOPQRSTUVWXYZÂÊÎÏÔÛâêîïôûéÉèåÅÈàÀüùÙÌìëöõabcçdefghijklmnopqrstuvwxyz'
#_letters_ipa = "&°ɑɐɒæɓʙβɔɕçɗɖðʤəɘɚɛɜɝɞɟʄɡɠɢʛɦɧħɥʜɨɪʝɭɬɫɮʟɱɯɰŋɳɲɴøɵɸθœɶʘɹɺɾɻʀʁɽʂʃʈʧʉʊʋⱱʌɣɤʍχʎʏʑʐʒʔʡʕʢǀǁǂǃˈˌːˑʼʴʰʱʲʷˠˤ˞↓↑→↗↘'̩'ᵻ"
#_letters_ipa_lisn = " !,./0123456789:?@ACDEILMNOPSUXYZ_abcdefghijklmnoprstuvwxyz|~"

# NOTE(review): the tail of _full_alphabet looks like it repeats 'û' and
# 'PRSTVWYZ', which would leave duplicate entries in `symbols`. Confirm how
# consumers map symbols to ids before removing anything.

# Export all symbols: the punctuation entry first, then one entry per
# character of _full_alphabet, in string order.
# Disabled composition:
#   [_pad] + list(_punctuation) + list(_letters) + list(_numbers) + list(_letters_ipa)
symbols = [_punctuation]
symbols.extend(_full_alphabet)

# Special symbol ids
# Position of the first " " entry in `symbols`.
SPACE_ID = symbols.index(" ")