testspace / builder /fetch_models.py
StormblessedKal's picture
change device for whisper
96979b3
raw
history blame
369 Bytes
# Warm-up script: runs the voice-segmentation, model-loading and audio-enhancement
# steps once on a sample clip. All results are discarded.
# NOTE(review): presumably the point is to trigger model downloads/caching
# (the file is named fetch_models.py) -- confirm against the build setup.
import se_extractor as se

# Sample clip fed to every step below.
SAMPLE_AUDIO = 'openai_source_output.mp3'

# Return values are intentionally ignored; the calls are made for their side effects.
_ = se.generate_voice_segments(SAMPLE_AUDIO, vad=False)
_ = se.load_model()

# Import order is kept as in the original script.
from resemble_enhance.enhancer.inference import denoise, enhance
import torch
import torchaudio

# Use the GPU when one is available, otherwise fall back to the CPU so the
# script does not crash on hosts without CUDA.
device = 'cuda' if torch.cuda.is_available() else 'cpu'

dwav, sr = torchaudio.load(SAMPLE_AUDIO)
# Average over dim 0 (the channel axis with torchaudio.load's default
# channels-first layout), collapsing the clip to a single 1-D waveform.
dwav = dwav.mean(dim=0)
wav1, new_sr = enhance(dwav, sr, device, nfe=32, solver='midpoint', lambd=0.9, tau=0.5)