File size: 1,418 Bytes
223aff6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
""" from https://github.com/keithito/tacotron """
from loguru import logger
# from app.config import Config
from . import cleaners

# Cached symbol -> ID lookup table, built lazily by text_to_sequence().
_symbol_to_id = None
# Snapshot (tuple) of the symbols that `_symbol_to_id` was built from; used to
# detect when a caller passes a different symbol set.
_symbol_cache_key = None


def text_to_sequence(text, symbols, cleaner_names):
    '''Converts a string of text to a sequence of IDs corresponding to the symbols in the text.

    The text is first run through the cleaners named in ``cleaner_names``;
    each character of the cleaned text is then mapped to its index in
    ``symbols``. Characters that do not occur in ``symbols`` are silently
    dropped from the result.

    NOTE: ``symbols`` is supplied by the caller instead of being read from
    the app Config; the original author reported being unable to access the
    Config variable from this module.

      Args:
        text: string to convert to a sequence
        symbols: list of symbols; a symbol's ID is its position in this list
          (if a symbol is repeated, its last position wins)
        cleaner_names: names of the cleaner functions to run the text through

      Returns:
        List of integers corresponding to the symbols in the text
    '''
    global _symbol_to_id, _symbol_cache_key

    # Rebuild the lookup table whenever the symbol set differs from the one
    # it was built from. Building it only once would silently return IDs from
    # a stale table when a later call passes different symbols.
    cache_key = tuple(symbols)
    if _symbol_to_id is None or cache_key != _symbol_cache_key:
        _symbol_to_id = {s: i for i, s in enumerate(cache_key)}
        _symbol_cache_key = cache_key

    clean_text = _clean_text(text, cleaner_names)

    # Membership is tested on the dict itself; unknown characters are skipped.
    return [
        _symbol_to_id[symbol] for symbol in clean_text if symbol in _symbol_to_id
    ]


def _clean_text(text, cleaner_names):
    '''Runs ``text`` through each named cleaner, in order, and returns the result.

      Args:
        text: string to clean
        cleaner_names: names of attributes of the ``cleaners`` module; each is
          looked up and called with the current text

      Returns:
        The output of the last cleaner, or ``text`` unchanged when
        ``cleaner_names`` is empty

      Raises:
        AttributeError: if a name does not resolve to a cleaner in ``cleaners``
    '''
    for name in cleaner_names:
        # The None default matters: without it getattr() raises its own
        # AttributeError for a missing name and the check below can never
        # report which cleaner was unknown.
        cleaner = getattr(cleaners, name, None)
        if not cleaner:
            # AttributeError keeps callers that caught the old lookup failure
            # working, and is still an Exception for broader handlers.
            raise AttributeError('Unknown cleaner: %s' % name)
        text = cleaner(text)
    return text