Spaces:

cdactvm
/

demoASR

Sleeping

App Files Files Community

cdactvm committed on Aug 6, 2024

Commit

968793a

verified ·

1 Parent(s): 6efc2bb

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -1

app.py CHANGED Viewed

@@ -11,6 +11,7 @@ import re
 # Initialize the speech recognition pipeline and transliterator
 p1 = pipeline(task="automatic-speech-recognition", model="cdactvm/w2v-bert-2.0-odia_v1")
 p2 = pipeline(task="automatic-speech-recognition", model="cdactvm/w2v-bert-2.0-hindi_v1")
 #p3 = pipeline(task="automatic-speech-recognition", model="cdactvm/kannada_w2v-bert_model")
 #p4 = pipeline(task="automatic-speech-recognition", model="cdactvm/telugu_w2v-bert_model")
@@ -47,7 +48,26 @@ def transcribe_odiya(speech):
         return "Error: ASR returned None"
     return text
 def cleanhtml(raw_html):
     """Return *raw_html* with every ``<...>`` span removed."""
     # Non-greedy pattern: each span from a '<' to the nearest following '>' is dropped.
     return re.sub(r'<.*?>', '', raw_html)
@@ -196,7 +216,11 @@ def sel_lng(lng, mic=None, file=None):
     elif lng == "Assamese-LM":
        return transcribe_assamese_LM(audio)
     elif lng == "Assamese-Model2":
        return transcribe_assamese_model2(audio)
 # Function to replace incorrectly spelled words
@@ -423,7 +447,7 @@ demo=gr.Interface(
     inputs=[
         #gr.Dropdown(["Hindi","Hindi-trans","Odiya","Odiya-trans","Kannada","Kannada-trans","Telugu","Telugu-trans","Bangala","Bangala-trans"],value="Hindi",label="Select Language"),
-        gr.Dropdown(["Hindi","Hindi-trans","Odiya","Odiya-trans","Assamese-LM","Assamese-Model2"],value="Hindi",label="Select Language"),
         gr.Audio(sources=["microphone","upload"], type="filepath"),
         #gr.Audio(sources="upload", type="filepath"),
         #"state"

 # Initialize the speech recognition pipeline and transliterator
 p1 = pipeline(task="automatic-speech-recognition", model="cdactvm/w2v-bert-2.0-odia_v1")
+odia-model2 = pipeline(task="automatic-speech-recognition", model="cdactvm/w2v-bert-odia_v1")
 p2 = pipeline(task="automatic-speech-recognition", model="cdactvm/w2v-bert-2.0-hindi_v1")
 #p3 = pipeline(task="automatic-speech-recognition", model="cdactvm/kannada_w2v-bert_model")
 #p4 = pipeline(task="automatic-speech-recognition", model="cdactvm/telugu_w2v-bert_model")
         return "Error: ASR returned None"
     return text
+###################################
+def transcribe_odiya_model2(speech):
+    text = odia-model2(speech)["text"]
+    if text is None:
+        return "Error: ASR returned None"
+    return text
+def transcribe_odiya_eng_model2(speech):
+    trn = Transliterator(source='ori', target='eng', build_lookup=True)
+    text = odia-model2(speech)["text"]
+    if text is None:
+        return "Error: ASR returned None"
+    sentence = trn.transform(text)
+    if sentence is None:
+        return "Error: Transliteration returned None"
+    replaced_words = replace_words(sentence)
+    processed_sentence = process_doubles(replaced_words)
+    return process_transcription(processed_sentence)
+########################################
 def cleanhtml(raw_html):
     """Return *raw_html* with every ``<...>`` span removed."""
     # Non-greedy pattern: each span from a '<' to the nearest following '>' is dropped.
     return re.sub(r'<.*?>', '', raw_html)
     elif lng == "Assamese-LM":
        return transcribe_assamese_LM(audio)
     elif lng == "Assamese-Model2":
+       return transcribe_odiya_model2(audio)
+    elif lng == "Odia_model2":
        return transcribe_assamese_model2(audio)
+    elif lng == "Odia_trans_model2":
+       return transcribe_odiya_eng_model2(audio)
 # Function to replace incorrectly spelled words
     inputs=[
         #gr.Dropdown(["Hindi","Hindi-trans","Odiya","Odiya-trans","Kannada","Kannada-trans","Telugu","Telugu-trans","Bangala","Bangala-trans"],value="Hindi",label="Select Language"),
+        gr.Dropdown(["Hindi","Hindi-trans","Odiya","Odiya-trans","Odia_model2","Odia_trans_model2","Assamese-LM","Assamese-Model2"],value="Hindi",label="Select Language"),
         gr.Audio(sources=["microphone","upload"], type="filepath"),
         #gr.Audio(sources="upload", type="filepath"),
         #"state"