audioseal_watermark_detection

Sleeping

Kabatubare committed on Feb 29, 2024

Commit

4e2a28d

verified ·

1 Parent(s): 9ffef8e

Update

Files changed (1) hide show

app.py CHANGED Viewed

@@ -15,6 +15,15 @@ except ImportError as e:
     audioseal_available = False
     print(f"AudioSeal could not be imported: {e}")
 def extract_mfcc_features(waveform, sample_rate, n_mfcc=40, n_mels=128, win_length=400, hop_length=160):
     mfcc_transform = T.MFCC(
         sample_rate=sample_rate,
@@ -44,6 +53,11 @@ def plot_spectrogram(waveform, sample_rate):
     buf.seek(0)
     return Image.open(buf)
 def detect_watermark(waveform, sample_rate):
     """Detect watermark in the uploaded audio using AudioSeal."""
     if audioseal_available:
@@ -87,4 +101,3 @@ interface = gr.Interface(
 if __name__ == "__main__":
     interface.launch()

     audioseal_available = False
     print(f"AudioSeal could not be imported: {e}")
+def load_and_resample_audio(audio_file_path, target_sample_rate=16000):  # Load an audio file and return its waveform at target_sample_rate (default 16000).
+    waveform, sample_rate = torchaudio.load(audio_file_path)  # sample_rate is the rate reported for the loaded file
+    # Resample only when the file's own rate differs from the target; otherwise the waveform is returned as loaded.
+    if sample_rate != target_sample_rate:
+        resampler = torchaudio.transforms.Resample(orig_freq=sample_rate, new_freq=target_sample_rate)
+        waveform = resampler(waveform)
+    return waveform, target_sample_rate  # the returned rate is always the target, never the file's original rate
 def extract_mfcc_features(waveform, sample_rate, n_mfcc=40, n_mels=128, win_length=400, hop_length=160):
     mfcc_transform = T.MFCC(
         sample_rate=sample_rate,
     buf.seek(0)
     return Image.open(buf)
+    audio_file_path = "path_to_your_audio_file.wav"
+    waveform, resampled_sr = load_and_resample_audio(audio_file_path)
+    detect_watermark(waveform, resampled_sr)
 def detect_watermark(waveform, sample_rate):
     """Detect watermark in the uploaded audio using AudioSeal."""
     if audioseal_available:
 if __name__ == "__main__":
     interface.launch()