Zw07 committed on
Commit
3c6d125
·
verified ·
1 Parent(s): 4e90fee

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -2
app.py CHANGED
@@ -12,6 +12,7 @@ import torchaudio
12
  from pydub import AudioSegment
13
  import io
14
  import librosa
 
15
  # import numpy
16
 
17
  # def my_read_file(audio_path, max_second):
@@ -105,9 +106,14 @@ def main():
105
  wav= wav.unsqueeze(0)
106
 
107
  elif file_extension == ".mp3":
108
- torchaudio.set_audio_backend("ffmpeg")
 
 
 
 
 
109
  #wav3, sample_rate = librosa.load("test.mp3")
110
- wav3, sample_rate = torchaudio.load("test.mp3")
111
  st.markdown(wav3)
112
  #RuntimeError: Could not infer dtype of numpy.float32
113
  #wav = torch.tensor(wav3).float() / 32768.0
 
12
  from pydub import AudioSegment
13
  import io
14
  import librosa
15
+ from torchaudio.io import CodecConfig
16
  # import numpy
17
 
18
  # def my_read_file(audio_path, max_second):
 
106
  wav= wav.unsqueeze(0)
107
 
108
  elif file_extension == ".mp3":
109
+
110
+ # Switch to the SoX backend
111
+ torchaudio.set_audio_backend("sox")
112
+
113
+ # Define CodecConfig for MP3 compression
114
+ #codec_config = CodecConfig(format="mp3", compression=128) # 128 kbps for MP3
115
  #wav3, sample_rate = librosa.load("test.mp3")
116
+ wav3, sample_rate = torchaudio.load("test.mp3",compression =-4.5)
117
  st.markdown(wav3)
118
  #RuntimeError: Could not infer dtype of numpy.float32
119
  #wav = torch.tensor(wav3).float() / 32768.0