chinmaydan committed on
Commit 875c690 · 1 Parent(s): 35839aa

deciding on final language

Files changed (1)
  1. app.py +8 -17
app.py CHANGED
@@ -10,18 +10,13 @@ model = whisper.load_model("small")
 
 # A table to look up all the languages
 language_id_lookup = {
+                "Arabic"    : "ar",
                 "English"   : "en",
+                "Chinese"   : "zh",
                 "German"    : "de",
-                "Greek"     : "el",
                 "Spanish"   : "es",
-                "Finnish"   : "fi",
                 "Russian"   : "ru",
-                "Hungarian" : "hu",
-                "Dutch"     : "nl",
                 "French"    : "fr",
-                'Polish'    : "pl",
-                'Portuguese': "pt",
-                'Italian'   : "it",
                 }
 
 
@@ -69,26 +64,22 @@ def predict(audio, language, mic_audio=None):
 title = "Demo for Whisper -> Something -> XLS-R"
 
 description = """
-<b>How to use:</b> Upload an audio file or record using the microphone. The audio is converted to mono and resampled to 16 kHz before
-being passed into the model. The output is the text transcription of the audio.
+<b>How to use:</b> Upload an audio file or record using the microphone. The audio is passed into the Whisper model developed by OpenAI.
+The output is the text transcription of the audio in the language you selected. If you asked the model to detect the language, it will
+tell you what language it detected.
 """
 
 gr.Interface(
     fn=predict,
     inputs=[
         gr.Audio(label="Upload Speech", source="upload", type="filepath"),
-        gr.inputs.Dropdown(['English Text',
+        gr.inputs.Dropdown(['Arabic Text',
+                            'Chinese Text',
+                            'English Text',
                             'German Text',
-                            'Greek Text',
                             'Spanish Text',
-                            'Finnish Text',
                             'Russian Text',
-                            'Hungarian Text',
-                            'Dutch Text',
                             'French Text',
-                            'Polish Text',
-                            'Portuguese Text',
-                            'Italian Text',
                             'Detect Language'], type="value", default='English Text', label="Select the language that you are speaking in."),
         gr.Audio(label="Record Speech", source="microphone", type="filepath"),
     ],
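Note: the body of predict is outside the hunks shown above, so the sketch below is only a minimal illustration of how the trimmed-down language_id_lookup table and the dropdown value plausibly reach Whisper. The " Text" suffix-stripping and the preference for the microphone input are assumptions, not code from this commit; passing language=None to model.transcribe() for auto-detection and reading result["language"] are standard openai-whisper behavior.

import whisper

model = whisper.load_model("small")

# Language table as it stands after this commit.
language_id_lookup = {
    "Arabic"  : "ar",
    "English" : "en",
    "Chinese" : "zh",
    "German"  : "de",
    "Spanish" : "es",
    "Russian" : "ru",
    "French"  : "fr",
}

def predict(audio, language, mic_audio=None):
    # Assumption: prefer the microphone recording when both inputs are present.
    path = mic_audio if mic_audio is not None else audio

    # Dropdown values end in " Text" (e.g. "Arabic Text"); strip that suffix and
    # map the plain name to Whisper's two-letter code. "Detect Language" becomes
    # None, which tells Whisper to auto-detect the spoken language.
    if language == "Detect Language":
        lang = None
    else:
        lang = language_id_lookup[language.rsplit(" ", 1)[0]]

    result = model.transcribe(path, language=lang)
    # transcribe() reports the language it used (or detected) under "language".
    return f"Detected language: {result['language']}\n\n{result['text']}"

Because the dropdown is created with type="value", the selected label string itself (e.g. 'Arabic Text') is what arrives as the language argument, which is why the lookup keys are plain language names. If detection probabilities were needed explicitly, openai-whisper also exposes model.detect_language() on a padded log-mel spectrogram, but language=None in transcribe() is the simpler route for this demo.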