File size: 775 Bytes
2ac71d3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
"""
Defines the set of symbols used in text input to the model.

The default is a set of ASCII characters that works well for English or text that has been run
through Unidecode. For other data, you can modify _characters. See TRAINING_DATA.md for details.
"""
# from . import cmudict
from .korean import ALL_SYMBOLS, PAD, EOS


# English symbol set: PAD and EOS first, followed by the ASCII letters and
# basic punctuation (including the space character).
# Kept for deployment; per the original note, the Korean ALL_SYMBOLS follows
# this same convention.
en_symbols = (
    PAD
    + EOS
    + 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz!\'(),-.:;? '
)

# The Korean symbol set is the one exported as `symbols`.
symbols = ALL_SYMBOLS
# 
# # Prepend "@" to ARPAbet symbols to ensure uniqueness (some are the same as uppercase letters):
# #_arpabet = ['@' + s for s in cmudict.valid_symbols]
# 
# # Export all symbols:
# symbols = [PAD, EOS] + list(_characters) #+ _arpabet