File size: 742 Bytes
0cecb96 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 |
from speechbrain.pretrained import SpectralMaskEnhancement
import torchaudio
model = SpectralMaskEnhancement.from_hparams(source="speechbrain/metricgan-plus-voicebank", )
from speechbrain.pretrained import SpectralMaskEnhancement
import torchaudio
import torch
model = SpectralMaskEnhancement.from_hparams(source="speechbrain/metricgan-plus-voicebank")
def remove_noise(input_path, output_path):
enhanced = model.enhance_file(input_path)
waveform, sample_rate = enhanced
if waveform.dim() == 0:
raise ValueError(f"Enhanced waveform is empty for file: {input_path}")
elif waveform.dim() == 1:
waveform = waveform.unsqueeze(0)
torchaudio.save(output_path, waveform, sample_rate)
|