File size: 871 Bytes
e8bdc47
 
 
 
 
344c204
 
 
 
 
 
e8bdc47
 
344c204
e8bdc47
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
""" from https://github.com/keithito/tacotron """

# Defines the set of symbols used in text input to the model.
#
# Every character of the strings below becomes one entry of `symbols`, in the
# order: padding, punctuation, letters, digits, IPA letters. Positions in that
# list are used as ids (see SPACE_ID), so neither the order of the groups nor
# the order of the characters inside a group should be changed casually.
#
# NOTE(review): some characters occur more than once (for example the
# ellipsis in `_punctuation`), so `symbols` contains repeated entries.
# Removing them would shift the index of every later entry, including
# SPACE_ID -- confirm nothing depends on the current ids before de-duplicating.

# Single padding symbol; always the first entry of `symbols`.
_pad = '_'

# Punctuation marks; the final character is the plain space that SPACE_ID
# looks up.
_punctuation = '+/…;:,.!?¡¿—-–<>*)…"«»“”~̃ '

# Upper- and lower-case letters, including accented forms.
_letters = 'ABCÇDEFGHIJKLMNOPQRSTUVWXYZÂÊÎÏÔÛâêîïôûéÉèåÅÈàÀüùÙÌìëöõabcçdefghijklmnopqrstuvwxyz'

# Decimal digits.
_numbers = '0123456789'

# IPA letters, stress/length marks and modifier symbols.
_letters_ipa = "&°ɑɐɒæɓʙβɔɕçɗɖðʤəɘɚɛɜɝɞɟʄɡɠɢʛɦɧħɥʜɨɪʝɭɬɫɮʟɱɯɰŋɳɲɴøɵɸθœɶʘɹɺɾɻʀʁɽʂʃʈʧʉʊʋⱱʌɣɤʍχʎʏʑʐʒʔʡʕʢǀǁǂǃˈˌːˑʼʴʰʱʲʷˠˤ˞↓↑→↗↘'̩'ᵻ"

# Disabled alternative inventory, kept for reference (not part of `symbols`):
#_letters_ipa_lisn = " !,./0123456789:?@ACDEILMNOPSUXYZ_abcdefghijklmnoprstuvwxyz|~"

# Export all symbols: the pad symbol first, then each group split into its
# individual characters.
symbols = [_pad] + [
    char
    for group in (_punctuation, _letters, _numbers, _letters_ipa)
    for char in group
]

# Special symbol ids
# Index of the first plain-space entry in `symbols`.
SPACE_ID = symbols.index(' ')