Spaces:
Runtime error
Runtime error
update wav configs
Browse files - server/preprocess.py +6 -4
server/preprocess.py
CHANGED
@@ -4,7 +4,9 @@ Util functions to process any incoming audio data to be processable by the model
|
|
4 |
import torch
|
5 |
import torchaudio
|
6 |
|
7 |
-
def process_from_filename(filename, target_sample_rate=4800, wav_length=5):
|
|
|
|
|
8 |
wav, sample_rate = torchaudio.load(filename)
|
9 |
|
10 |
wav = process_raw_wav(wav, sample_rate, target_sample_rate, wav_length)
|
@@ -13,7 +15,7 @@ def process_from_filename(filename, target_sample_rate=4800, wav_length=5):
|
|
13 |
|
14 |
return spec
|
15 |
|
16 |
-
def process_raw_wav(wav, sample_rate, target_sample_rate=4800, wav_length=5):
|
17 |
num_samples = wav_length * target_sample_rate
|
18 |
|
19 |
wav = _resample(wav, sample_rate, target_sample_rate)
|
@@ -26,9 +28,9 @@ def process_raw_wav(wav, sample_rate, target_sample_rate=4800, wav_length=5):
|
|
26 |
def _wav_to_spec(wav, target_sample_rate):
|
27 |
mel_spectrogram = torchaudio.transforms.MelSpectrogram(
|
28 |
sample_rate=target_sample_rate,
|
29 |
-
n_fft=
|
30 |
hop_length=512,
|
31 |
-
n_mels=
|
32 |
)
|
33 |
|
34 |
return mel_spectrogram(wav)
|
|
|
4 |
import torch
|
5 |
import torchaudio
|
6 |
|
7 |
+
DEFAULT_SAMPLE_RATE=48000
|
8 |
+
|
9 |
+
def process_from_filename(filename, target_sample_rate=DEFAULT_SAMPLE_RATE, wav_length=5):
|
10 |
wav, sample_rate = torchaudio.load(filename)
|
11 |
|
12 |
wav = process_raw_wav(wav, sample_rate, target_sample_rate, wav_length)
|
|
|
15 |
|
16 |
return spec
|
17 |
|
18 |
+
def process_raw_wav(wav, sample_rate=DEFAULT_SAMPLE_RATE, target_sample_rate=DEFAULT_SAMPLE_RATE, wav_length=5):
|
19 |
num_samples = wav_length * target_sample_rate
|
20 |
|
21 |
wav = _resample(wav, sample_rate, target_sample_rate)
|
|
|
28 |
def _wav_to_spec(wav, target_sample_rate):
|
29 |
mel_spectrogram = torchaudio.transforms.MelSpectrogram(
|
30 |
sample_rate=target_sample_rate,
|
31 |
+
n_fft=2048,
|
32 |
hop_length=512,
|
33 |
+
n_mels=128,
|
34 |
)
|
35 |
|
36 |
return mel_spectrogram(wav)
|