File size: 583 Bytes
335eff1
49464b8
 
335eff1
0f06115
49464b8
335eff1
0f06115
49464b8
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
import os
from pyannote.audio import Model
from pyannote.audio.pipelines import VoiceActivityDetection
# Hugging Face access token taken from the environment; None when HF_TOKEN is unset.
hf_token = os.getenv("HF_TOKEN")

# Load the pretrained "pyannote/segmentation" checkpoint, forwarding the token.
model = Model.from_pretrained(
    "pyannote/segmentation",
    use_auth_token=hf_token,
)

# Hyper-parameters passed verbatim to the pipeline's instantiate() call below.
HYPER_PARAMETERS = {
    "onset": 0.5,
    "offset": 0.5,
    "min_duration_on": 0.0,
    "min_duration_off": 0.0,
}

# Build the voice-activity-detection pipeline around the loaded model, then
# configure it once at import time so vad_pipeline is ready to be called.
vad_pipeline = VoiceActivityDetection(segmentation=model)
vad_pipeline.instantiate(HYPER_PARAMETERS)
def vad_segmentation(input_path, output_path, aggressiveness=2):
    """Run the module-level VAD pipeline on ``input_path`` and return its result.

    Args:
        input_path: Input forwarded unchanged to ``vad_pipeline``.
        output_path: Accepted but not used by this implementation.
        aggressiveness: Accepted but not used by this implementation.

    Returns:
        Whatever ``vad_pipeline(input_path)`` returns (presumably a pyannote
        annotation of detected speech regions -- TODO confirm).
    """
    speech_regions = vad_pipeline(input_path)
    return speech_regions