Spaces:

atlasia
/

Moroccan-Fast-Speech-to-Text-Transcription

Running on Zero

App Files Files Community

BounharAbdelaziz committed 28 days ago

Commit

1e9de44

verified ·

1 Parent(s): 1e4f628

v0.1: removed save to eval dataset for now

Browse files

Files changed (1) hide show

utils.py +12 -2

utils.py CHANGED Viewed

@@ -15,10 +15,15 @@ from datasets import (
     Audio,
 )
 # Hugging Face evaluation dataset
 HF_DATASET_NAME = "BounharAbdelaziz/Moroccan-STT-Eval-Dataset"
 # Models paths
 MODEL_PATHS = {
     "NANO": "BounharAbdelaziz/Morocco-Darija-STT-tiny",
@@ -26,6 +31,9 @@ MODEL_PATHS = {
     "LARGE": "BounharAbdelaziz/Morocco-Darija-STT-large-v1.2",
 }
 # Access token to models
 STT_MODEL_TOKEN = os.environ.get("STT_MODEL_TOKEN")
@@ -56,7 +64,6 @@ def create_html_image(image_path):
     """
     return html_string
 # ---------------------------------------------------------------------------- #
 # ---------------------------------------------------------------------------- #
@@ -105,6 +112,9 @@ def load_model(model_name):
 # ---------------------------------------------------------------------------- #
 def process_audio(audio, model_choice, save_data):
     pipe = load_model(model_choice)
     audio_signal = audio[1]
     sample_rate = audio[0]
@@ -161,7 +171,7 @@ def create_interface():
         with gr.Row():
             save_data = gr.Checkbox(
                 label="Contribute to the evaluation benchmark",
-                value=True
             )
         submit_btn = gr.Button("Transcribe 🔥")

     Audio,
 )
+# ---------------------------------------------------------------------------- #
+# ---------------------------------------------------------------------------- #
 # Hugging Face evaluation dataset
 HF_DATASET_NAME = "BounharAbdelaziz/Moroccan-STT-Eval-Dataset"
+# ---------------------------------------------------------------------------- #
+# ---------------------------------------------------------------------------- #
 # Models paths
 MODEL_PATHS = {
     "NANO": "BounharAbdelaziz/Morocco-Darija-STT-tiny",
     "LARGE": "BounharAbdelaziz/Morocco-Darija-STT-large-v1.2",
 }
+# ---------------------------------------------------------------------------- #
+# ---------------------------------------------------------------------------- #
 # Access token to models
 STT_MODEL_TOKEN = os.environ.get("STT_MODEL_TOKEN")
     """
     return html_string
 # ---------------------------------------------------------------------------- #
 # ---------------------------------------------------------------------------- #
 # ---------------------------------------------------------------------------- #
 def process_audio(audio, model_choice, save_data):
+    # Force to false for now, issue with dataset
+    save_data = False
     pipe = load_model(model_choice)
     audio_signal = audio[1]
     sample_rate = audio[0]
         with gr.Row():
             save_data = gr.Checkbox(
                 label="Contribute to the evaluation benchmark",
+                value=False,
             )
         submit_btn = gr.Button("Transcribe 🔥")