wavlm-large / s3prl_s3prl_main /s3prl /dataset /speech2phoneme_pipe.py
lmzjms's picture
Upload 1162 files
0b32ad6 verified
raw
history blame contribute delete
620 Bytes
from .base import SequentialDataPipe
from .common_pipes import LoadAudio, Phonemize, SetOutputKeys
class Speech2PhonemePipe(SequentialDataPipe):
"""
each item in the input dataset should have:
wav_path: str
transcription: str
"""
def __init__(self):
output_keys = dict(
x="wav",
x_len="wav_len",
labels="phonemized_text",
class_ids="tokenized_text",
unique_name="id",
)
super().__init__(
LoadAudio(),
Phonemize(),
SetOutputKeys(output_keys=output_keys),
)