Update app.py
Browse files
app.py
CHANGED
@@ -12,6 +12,7 @@ import torchaudio
|
|
12 |
from pydub import AudioSegment
|
13 |
import io
|
14 |
import librosa
|
|
|
15 |
# import numpy
|
16 |
|
17 |
# def my_read_file(audio_path, max_second):
|
@@ -105,9 +106,14 @@ def main():
|
|
105 |
wav= wav.unsqueeze(0)
|
106 |
|
107 |
elif file_extension == ".mp3":
|
108 |
-
|
|
|
|
|
|
|
|
|
|
|
109 |
#wav3, sample_rate = librosa.load("test.mp3")
|
110 |
-
wav3, sample_rate = torchaudio.load("test.mp3")
|
111 |
st.markdown(wav3)
|
112 |
#RuntimeError: Could not infer dtype of numpy.float32
|
113 |
#wav = torch.tensor(wav3).float() / 32768.0
|
|
|
12 |
from pydub import AudioSegment
|
13 |
import io
|
14 |
import librosa
|
15 |
+
from torchaudio.io import CodecConfig
|
16 |
# import numpy
|
17 |
|
18 |
# def my_read_file(audio_path, max_second):
|
|
|
106 |
wav= wav.unsqueeze(0)
|
107 |
|
108 |
elif file_extension == ".mp3":
|
109 |
+
|
110 |
+
# Switch to the SoX backend (the call below selects "sox", not FFmpeg)
|
111 |
+
torchaudio.set_audio_backend("sox")
|
112 |
+
|
113 |
+
# Define CodecConfig for MP3 compression
|
114 |
+
#codec_config = CodecConfig(format="mp3", compression=128) # 128 kbps for MP3
|
115 |
#wav3, sample_rate = librosa.load("test.mp3")
|
116 |
+
wav3, sample_rate = torchaudio.load("test.mp3",compression =-4.5)
|
117 |
st.markdown(wav3)
|
118 |
#RuntimeError: Could not infer dtype of numpy.float32
|
119 |
#wav = torch.tensor(wav3).float() / 32768.0
|