File size: 583 Bytes
335eff1 49464b8 335eff1 0f06115 49464b8 335eff1 0f06115 49464b8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 |
import os
from pyannote.audio import Model
from pyannote.audio.pipelines import VoiceActivityDetection
# Access token for the Hugging Face Hub, read from the environment.
# os.getenv returns None when HF_TOKEN is not set.
hf_token = os.getenv("HF_TOKEN")

# Load the pretrained segmentation model and wrap it in a
# voice-activity-detection pipeline. This runs once, at import time.
model = Model.from_pretrained(
    "pyannote/segmentation",
    use_auth_token=hf_token,
)
vad_pipeline = VoiceActivityDetection(segmentation=model)

# Hyper-parameters handed to the pipeline below.
# NOTE(review): presumably onset/offset are activation thresholds and the
# min_duration_* values are in seconds — confirm against pyannote docs.
HYPER_PARAMETERS = {
    "onset": 0.5,
    "offset": 0.5,
    "min_duration_on": 0.0,
    "min_duration_off": 0.0,
}
vad_pipeline.instantiate(HYPER_PARAMETERS)
def vad_segmentation(input_path, output_path, aggressiveness=2):
    """Run the module-level VAD pipeline on ``input_path``.

    Args:
        input_path: Passed unchanged to ``vad_pipeline``.
            Presumably a path to an audio file — confirm with callers.
        output_path: Accepted but not used by this implementation;
            nothing is written to it.
        aggressiveness: Accepted but not used by this implementation.

    Returns:
        Whatever ``vad_pipeline(input_path)`` returns.
    """
    detected = vad_pipeline(input_path)
    return detected
|