Spaces:

nimool
/

gbn_test

Sleeping

App Files Community

nimool committed on Oct 4, 2023

Commit

c442756

1 Parent(s): 121ba7f

Update app.py

Browse files

Files changed (1) hide show

app.py +22 -2

app.py CHANGED Viewed

@@ -5,6 +5,7 @@ import gradio as gr
 import sox
 import subprocess
 from fuzzywuzzy import fuzz
 def read_file_and_process(wav_file):
@@ -35,7 +36,26 @@ def parse(wav_file):
     input_values = read_file_and_process(wav_file)
     with torch.no_grad():
         logits = model(**input_values).logits
-    return parse_transcription(logits)
 model_id = "jonatasgrosman/wav2vec2-large-xlsr-53-persian"
 processor = Wav2Vec2Processor.from_pretrained(model_id)
@@ -59,7 +79,7 @@ title = "Speech-to-Text (persian)"
 description = "، توجه داشته باشید که هرچه گفتار شما شمرده تر باشد خروجی با کیفیت تری دارید.روی دکمه ضبط صدا کلیک کنید و سپس دسترسی مرورگر خود را به میکروفون دستگاه بدهید، سپس شروع به صحبت کنید و برای اتمام ضبط دوباره روی دکمه کلیک کنید"
 article = "<p style='text-align: center'><a href='https://github.com/nimaprgrmr'>Large-Scale Self- and Semi-Supervised Learning for Speech Translation</a></p>"
-demo = gr.Interface(fn=parse, inputs = input_,  outputs=txtbox, title=title, description=description, article = article,
              streaming=True, interactive=True,
              analytics_enabled=False, show_tips=False, enable_queue=True)
 demo.launch(share=True)

 import sox
 import subprocess
 from fuzzywuzzy import fuzz
+from data import dataset
 def read_file_and_process(wav_file):
     input_values = read_file_and_process(wav_file)
     with torch.no_grad():
         logits = model(**input_values).logits
+    user_question = parse_transcription(logits)
+    return user_question
+# Look up the stored answer whose question best fuzzy-matches the user's question.
+def get_answer(user_question):
+    """Return the answer of the closest-matching dataset question.
+
+    Each entry of ``dataset`` is scored against ``user_question`` with
+    ``fuzz.token_set_ratio``; the first entry reaching the highest score wins.
+    The fallback message is returned when the best score is below 80.
+    """
+    top_score, top_answer = 0, None
+    for entry in dataset:
+        score = fuzz.token_set_ratio(user_question, entry["question"])
+        if score <= top_score:
+            continue  # only a strictly better score replaces the current best
+        top_score, top_answer = score, entry["answer"]
+    # Adjust the similarity threshold as needed
+    if top_score < 80:
+        return "I don't have an answer to that question."
+    return top_answer
 model_id = "jonatasgrosman/wav2vec2-large-xlsr-53-persian"
 processor = Wav2Vec2Processor.from_pretrained(model_id)
 description = "، توجه داشته باشید که هرچه گفتار شما شمرده تر باشد خروجی با کیفیت تری دارید.روی دکمه ضبط صدا کلیک کنید و سپس دسترسی مرورگر خود را به میکروفون دستگاه بدهید، سپس شروع به صحبت کنید و برای اتمام ضبط دوباره روی دکمه کلیک کنید"
 article = "<p style='text-align: center'><a href='https://github.com/nimaprgrmr'>Large-Scale Self- and Semi-Supervised Learning for Speech Translation</a></p>"
+demo = gr.Interface(fn=get_answer, inputs = input_,  outputs=txtbox, title=title, description=description, article = article,
              streaming=True, interactive=True,
              analytics_enabled=False, show_tips=False, enable_queue=True)
 demo.launch(share=True)