Spaces:

oza75
/

bambara-asr

Sleeping

App Files Files Community

Aboubacar OUATTARA - kaira committed on Apr 26, 2024

Commit

4273f74

1 Parent(s): 589123e

add examples files

Browse files

Files changed (1) hide show

app.py +25 -2

app.py CHANGED Viewed

@@ -1,7 +1,11 @@
 import spaces
 import torch
 from transformers import pipeline
 import gradio as gr
 from bambara_utils import BambaraWhisperTokenizer
 # Determine the appropriate device (GPU or CPU)
@@ -31,15 +35,34 @@ def transcribe(audio):
     text = pipe(audio)["text"]
     return text
 def main():
     # Setup Gradio interface
     iface = gr.Interface(
         fn=transcribe,
-        inputs=gr.Audio(type="filepath"),
         outputs="text",
         title="Bambara Automatic Speech Recognition",
-        description="Realtime demo for Bambara speech recognition based on a fine-tuning of the Whisper model."
     )
     # Launch the interface

+import os
 import spaces
 import torch
 from transformers import pipeline
 import gradio as gr
+# NOTE: the import below overrides Whisper's LANGUAGES to add Bambara.
+# This is not the best way to do it, but at least it works. For more info, check the bambara_utils code.
 from bambara_utils import BambaraWhisperTokenizer
 # Determine the appropriate device (GPU or CPU)
     text = pipe(audio)["text"]
     return text
def get_wav_files(directory):
    """
    Returns a sorted list of absolute paths to all .wav files in the specified directory.

    Only the top level of the directory is scanned (no recursion). The
    extension match is case-insensitive, and entries that are not regular
    files (e.g. a sub-directory named "foo.wav") are ignored.

    Args:
        directory (str): The directory to search for .wav files.
    Returns:
        list: Absolute paths to the .wav files, ordered by file name.
            Empty if the directory contains no .wav files.
    Raises:
        OSError: Propagated from os.listdir when the directory does not
            exist or cannot be read.
    """
    wav_files = []
    # os.listdir returns entries in arbitrary order; sort them so that callers
    # relying on the position of an entry (e.g. the first one) get a stable result.
    for file_name in sorted(os.listdir(directory)):
        if not file_name.lower().endswith('.wav'):
            continue
        path = os.path.abspath(os.path.join(directory, file_name))
        # Skip directories (or other non-file entries) that merely look like .wav files
        if os.path.isfile(path):
            wav_files.append(path)
    return wav_files
 def main():
+    # Get a list of all .wav files in the examples directory
+    example_files = get_wav_files("./examples")
     # Setup Gradio interface
     iface = gr.Interface(
         fn=transcribe,
+        inputs=gr.Audio(type="filepath", value=example_files[0]),
         outputs="text",
         title="Bambara Automatic Speech Recognition",
+        description="Realtime demo for Bambara speech recognition based on a fine-tuning of the Whisper model.",
+        examples=example_files,
     )
     # Launch the interface