File size: 419 Bytes
e1412bc
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
import se_extractor as se

# Run se.generate_voice_segments on the same clip twice: first with
# vad=False, then with vad=True. The return value is bound to the
# throwaway name `_` and is not used afterwards.
for _vad_flag in (False, True):
    _ = se.generate_voice_segments('openai_source_output.mp3', vad=_vad_flag)

from resemble_enhance.enhancer.inference import denoise, enhance
import torchaudio


import torch  # local import: only needed for the CUDA availability check below

# Load the clip and average over dim 0 to get a single track.
# NOTE(review): assumes torchaudio.load returns a channel-first tensor
# (its documented default), so dim 0 is the channel axis — confirm.
dwav, sr = torchaudio.load('openai_source_output.mp3')
dwav = dwav.mean(dim=0)

# Use the first CUDA device when one is available; otherwise fall back to
# CPU so the script does not crash on machines without a GPU.
device = 'cuda:0' if torch.cuda.is_available() else 'cpu'

# enhance returns the processed waveform together with its sample rate.
# NOTE(review): wav1 / new_sr are not saved or used further in the visible
# part of this file.
wav1, new_sr = enhance(dwav, sr, device, nfe=32, solver='midpoint', lambd=0.9, tau=0.5)