Spaces:

alakxender
/

dhivehi-mms-demo

Running on Zero

App Files Community

alakxender committed on Feb 7

Commit

700fda9

1 Parent(s): dee3b49

u1

Browse files

Files changed (1) hide show

app.py +26 -7

app.py CHANGED Viewed

@@ -63,14 +63,33 @@ def transcribe(audio_file):
         return f"Error during transcription: {str(e)}"
 # Create Gradio interface
-iface = gr.Interface(
     fn=transcribe,
-    inputs=gr.Audio(type="filepath"),
-    outputs="text",
-    title="Dhivehi Speech Recognition with Language Model",
-    description="Upload an audio file to transcribe Dhivehi speech to text using language model enhanced decoding."
 )
 def install_requirements():
     requirements_path = 'requirements.txt'
@@ -116,7 +135,7 @@ if __name__ == "__main__":
         device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
-        MODEL_NAME = "alakxender/wav2vec2-large-mms-1b-dv-syn-md" # Trained on 100% Synthetic Data (130-150 Hours)
         # MODEL_NAME = "alakxender/wav2vec2-large-mms-1b-cv" # Trained on Common Voice Data (Unknown Hours)
         # MODEL_NAME =  "alakxender/whisper-small-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
         # MODEL_NAME = "alakxender/whisper-small-cv" # Trained on Common Voice Data (Unknown Hours)
@@ -142,6 +161,6 @@ if __name__ == "__main__":
         MAX_LENGTH = 120 # 2 minutes
         MIN_LENGTH = 1 # 1 second
-        iface.launch()
     else:
         print("Failed to install some requirements")

         return f"Error during transcription: {str(e)}"
 # Create Gradio interface
+css = """
+.textbox1 textarea {
+    font-size: 18px !important;
+    font-family: 'MV_Faseyha', 'Faruma', 'A_Faruma' !important;
+    line-height: 1.8 !important;
+}
+.textbox2 textarea {
+    display: none;
+}
+"""
+demo = gr.Blocks(css=css)
+tab_audio = gr.Interface(
     fn=transcribe,
+    inputs=[
+        gr.Audio(sources=["upload","microphone"], type="filepath", label="Audio"),
+    ],
+    outputs=gr.Textbox(label="Transcription", rtl=True, elem_classes="textbox1"),
+    title="Transcribe Dhivehi Audio",
+    allow_flagging="never",
 )
+with demo:
+    gr.TabbedInterface([tab_audio], ["Audio"])
 def install_requirements():
     requirements_path = 'requirements.txt'
         device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
+        MODEL_NAME = "alakxender/wav2vec2-large-mms-1b-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
         # MODEL_NAME = "alakxender/wav2vec2-large-mms-1b-cv" # Trained on Common Voice Data (Unknown Hours)
         # MODEL_NAME =  "alakxender/whisper-small-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
         # MODEL_NAME = "alakxender/whisper-small-cv" # Trained on Common Voice Data (Unknown Hours)
         MAX_LENGTH = 120 # 2 minutes
         MIN_LENGTH = 1 # 1 second
+        demo.launch()
     else:
         print("Failed to install some requirements")