amanmibra committed on
Commit
5fb3738
·
1 Parent(s): 29b2c35

update wav configs

Browse files
Files changed (1) hide show
  1. server/preprocess.py +6 -4
server/preprocess.py CHANGED
@@ -4,7 +4,9 @@ Util functions to process any incoming audio data to be processable by the model
4
  import torch
5
  import torchaudio
6
 
7
- def process_from_filename(filename, target_sample_rate=4800, wav_length=5):
 
 
8
  wav, sample_rate = torchaudio.load(filename)
9
 
10
  wav = process_raw_wav(wav, sample_rate, target_sample_rate, wav_length)
@@ -13,7 +15,7 @@ def process_from_filename(filename, target_sample_rate=4800, wav_length=5):
13
 
14
  return spec
15
 
16
- def process_raw_wav(wav, sample_rate, target_sample_rate=4800, wav_length=5):
17
  num_samples = wav_length * target_sample_rate
18
 
19
  wav = _resample(wav, sample_rate, target_sample_rate)
@@ -26,9 +28,9 @@ def process_raw_wav(wav, sample_rate, target_sample_rate=4800, wav_length=5):
26
  def _wav_to_spec(wav, target_sample_rate):
27
  mel_spectrogram = torchaudio.transforms.MelSpectrogram(
28
  sample_rate=target_sample_rate,
29
- n_fft=1024,
30
  hop_length=512,
31
- n_mels=64
32
  )
33
 
34
  return mel_spectrogram(wav)
 
4
  import torch
5
  import torchaudio
6
 
7
+ DEFAULT_SAMPLE_RATE=48000
8
+
9
+ def process_from_filename(filename, target_sample_rate=DEFAULT_SAMPLE_RATE, wav_length=5):
10
  wav, sample_rate = torchaudio.load(filename)
11
 
12
  wav = process_raw_wav(wav, sample_rate, target_sample_rate, wav_length)
 
15
 
16
  return spec
17
 
18
+ def process_raw_wav(wav, sample_rate=DEFAULT_SAMPLE_RATE, target_sample_rate=DEFAULT_SAMPLE_RATE, wav_length=5):
19
  num_samples = wav_length * target_sample_rate
20
 
21
  wav = _resample(wav, sample_rate, target_sample_rate)
 
28
  def _wav_to_spec(wav, target_sample_rate):
29
  mel_spectrogram = torchaudio.transforms.MelSpectrogram(
30
  sample_rate=target_sample_rate,
31
+ n_fft=2048,
32
  hop_length=512,
33
+ n_mels=128,
34
  )
35
 
36
  return mel_spectrogram(wav)