from .base import SequentialDataPipe | |
from .common_pipes import LoadAudio, Phonemize, SetOutputKeys | |
class Speech2PhonemePipe(SequentialDataPipe):
    """Sequential pipe chaining LoadAudio, Phonemize and SetOutputKeys.

    Each item in the input dataset should have:
        wav_path: str
        transcription: str
    """

    def __init__(self):
        # Mapping handed to SetOutputKeys as its ``output_keys`` argument.
        # NOTE(review): presumably the keys are the names exposed downstream
        # and the values are the item fields filled by the earlier stages --
        # confirm against SetOutputKeys.
        key_map = {
            "x": "wav",
            "x_len": "wav_len",
            "labels": "phonemized_text",
            "class_ids": "tokenized_text",
            "unique_name": "id",
        }

        # Stages are built and passed to the parent in this exact order.
        stages = (
            LoadAudio(),
            Phonemize(),
            SetOutputKeys(output_keys=key_map),
        )
        super().__init__(*stages)