Spaces:

cdactvm
/

Telugu_kannada_ASR_Demo

Sleeping

App Files Files Community

cdactvm committed on Jan 16

Commit

6484054

verified ·

1 Parent(s): 815dd35

Update app.py

Browse files

Files changed (1) hide show

app.py +100 -1

app.py CHANGED Viewed

@@ -31,7 +31,105 @@ from scipy.signal import butter, lfilter, wiener
 asr_model = pipeline("automatic-speech-recognition", model="cdactvm/telugu_w2v-bert_model")
 # Function to apply a high-pass filter
 def high_pass_filter(audio, sr, cutoff=300):
     nyquist = 0.5 * sr
@@ -62,12 +160,13 @@ def recognize_speech(audio_file):
     result = asr_model(denoised_audio)
     text_value = result['text']
     cleaned_text = text_value.replace("<s>", "")
     # cleaned_text=convert2num(cleaned_text,lex)
     # converted_to_list = convert_to_list(cleaned_text, text_to_list())
     # processed_doubles = process_doubles(converted_to_list)
     # replaced_words = replace_words(processed_doubles)
     # converted_text = text_to_int(replaced_words)
-    return cleaned_text
 def sel_lng(lng, mic=None, file=None):
     if mic is not None:

 asr_model = pipeline("automatic-speech-recognition", model="cdactvm/telugu_w2v-bert_model")
def createlex(filename):
    """Load a tab-separated lexicon file into a dictionary.

    Every non-blank line must hold exactly two tab-separated fields,
    ``key<TAB>value``. Leading and trailing whitespace on the line is
    stripped before splitting. If a key occurs more than once, the last
    occurrence wins.

    Args:
        filename: Path of the UTF-8 encoded lexicon file.

    Returns:
        A dict mapping each key string to its value string. Values are kept
        as text; no numeric conversion happens here.

    Raises:
        OSError: If the file cannot be opened.
        ValueError: If a non-blank line does not consist of exactly two
            tab-separated fields.
    """
    data_dict = {}
    # "utf-8-sig" reads plain UTF-8 and additionally drops a leading
    # byte-order mark, which would otherwise become part of the first key.
    with open(filename, "r", encoding="utf-8-sig") as f:
        for lineno, line in enumerate(f, start=1):
            entry = line.strip()
            if not entry:
                # Blank lines (e.g. an extra newline at the end of the file)
                # carry no entry and must not abort loading.
                continue
            fields = entry.split("\t")
            if len(fields) != 2:
                raise ValueError(
                    "{}:{}: expected 'key<TAB>value', got {!r}".format(
                        filename, lineno, entry
                    )
                )
            key, value = fields
            data_dict[key] = value
    return data_dict
+lex=createlex("num_words_tel.txt")
def addnum(inlist):
    """Return the integer sum of the items in *inlist*.

    Each item is converted with ``int()`` before being added, so the items
    may be ints or numeric strings. An empty iterable yields 0.

    Raises:
        ValueError: If an item is a string that ``int()`` cannot parse.
        TypeError: If an item is of a type ``int()`` does not accept.
    """
    # Use the builtin sum() instead of a local accumulator that shadowed it.
    return sum(int(num) for num in inlist)
+from rapidfuzz import process
def get_val(word, lexicon, threshold=80, length_difference=4):
    """Look up *word* in *lexicon* using fuzzy matching on the keys.

    The best-scoring key is obtained from ``rapidfuzz.process.extractOne``
    with ``score_cutoff=threshold``. The match is accepted only if its length
    differs from the length of *word* by at most *length_difference*
    characters.

    Args:
        word: The token to look up.
        lexicon: Mapping whose keys are candidate spellings.
        threshold: Minimum similarity score passed as ``score_cutoff``.
        length_difference: Maximum allowed absolute difference between
            ``len(match)`` and ``len(word)``.

    Returns:
        ``lexicon[match]`` for the accepted key, or ``None`` when
        ``extractOne`` returns no result or the length check fails.
    """
    result = process.extractOne(word, lexicon.keys(), score_cutoff=threshold)
    if result is None:
        return None
    # With a non-mapping choices iterable the result is
    # (matched_key, score, index); only the key is needed here.
    match = result[0]
    if abs(len(match) - len(word)) > length_difference:
        return None
    return lexicon[match]
def convert2num(input, lex):
    """Replace number words in *input* with digits, summing adjacent ones.

    The text is split on whitespace and each token is looked up with
    ``get_val(token, lex)``. Tokens with no lexicon value are copied through
    unchanged. Values of consecutive number tokens are collected and, when
    the run ends, replaced by their sum as computed by ``addnum``.

    Args:
        input: The text to convert.
        lex: Lexicon passed unchanged to ``get_val``.

    Returns:
        The converted tokens joined by single spaces, with no leading or
        trailing whitespace. Literal ``#`` characters in *input* are kept.
    """
    # Values treated as "single" numbers; a number token that follows one of
    # these closes the current run instead of extending it.
    # NOTE(review): membership is tested against ints. A lexicon built by
    # createlex() holds string values, for which this test never matches, so
    # every consecutive number token is simply summed. Confirm whether the
    # values should be converted with int() before this comparison.
    single_values = tuple(range(20))

    out_parts = []
    pending = []          # values of the current run, not yet emitted
    accumulating = False  # True while `pending` holds an open run
    prev_value = ""       # value of the previous token, "" if not a number

    for word in input.split():
        numval = get_val(word, lex)

        if numval is None:
            # An ordinary word ends any open run of number tokens.
            prev_value = ""
            if accumulating:
                out_parts.append(str(addnum(pending)))
                accumulating = False
                pending = []
            out_parts.append(word)
            continue

        if prev_value not in single_values:
            # Start or extend a run (e.g. a tens word followed by a unit).
            accumulating = True
            pending.append(numval)
        elif accumulating:
            # Previous value was a "single" number: close the run with this
            # value included and emit the total.
            pending.append(numval)
            out_parts.append(str(addnum(pending)))
            accumulating = False
            pending = []
        else:
            out_parts.append(str(numval))
        prev_value = numval

    # Flush a run that reaches the end of the text. This replaces appending a
    # "#" sentinel token and stripping every "#" from the result afterwards.
    if accumulating:
        out_parts.append(str(addnum(pending)))

    return " ".join(out_parts)
 # Function to apply a high-pass filter
 def high_pass_filter(audio, sr, cutoff=300):
     nyquist = 0.5 * sr
     result = asr_model(denoised_audio)
     text_value = result['text']
     cleaned_text = text_value.replace("<s>", "")
+    converted_text=convert2num(cleaned_text,lex)
     # cleaned_text=convert2num(cleaned_text,lex)
     # converted_to_list = convert_to_list(cleaned_text, text_to_list())
     # processed_doubles = process_doubles(converted_to_list)
     # replaced_words = replace_words(processed_doubles)
     # converted_text = text_to_int(replaced_words)
+    return cleaned_text +" -----------------> " + converted_text
 def sel_lng(lng, mic=None, file=None):
     if mic is not None: