Spaces:

nailarais1
/

accessible-math-solver

Sleeping

App Files Files Community

nailarais1 committed on Dec 14, 2024

Commit

1c668c5

verified ·

1 Parent(s): 9a12661

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -21

app.py CHANGED Viewed

@@ -5,24 +5,30 @@ import os
 import gradio as gr
 # Function to convert speech to text using CMU Sphinx
-def voice_to_text():
     recognizer = sr.Recognizer()
-    # Using the default microphone as the audio source
-    with sr.Microphone() as source:
-        print("Please speak a math expression (e.g., '2 plus 2', 'integrate x squared')...")
-        recognizer.adjust_for_ambient_noise(source)
-        audio = recognizer.listen(source)
-        try:
-            # Using CMU Sphinx for offline recognition
-            text = recognizer.recognize_sphinx(audio)
-            print(f"Recognized text: {text}")
-            return text
-        except sr.UnknownValueError:
-            return "Sorry, I could not understand the audio."
-        except sr.RequestError:
-            return "Could not request results from Sphinx service."
 # Function to map speech to mathematical symbols
 def convert_speech_to_math(text):
@@ -74,10 +80,10 @@ def process_math(query):
         return f"Error: Unable to process the query. Please check the syntax. Error: {e}", None
 # Gradio interface function to handle the input
-def calculator(choice, text_input=None):
     if choice == "voice":
-        # Convert speech to text using CMU Sphinx
-        query = voice_to_text()
         if query.lower() == "sorry, i could not understand the audio.":
             return query, None
@@ -103,7 +109,8 @@ def start_interface():
         fn=calculator,
         inputs=[
             gr.Radio(["voice", "text"], label="Choose Input Type"),  # Option to select between voice and text input
-            gr.Textbox(label="Or Type a Math Expression (Optional)", placeholder="Type your math expression here...", visible=False)  # Hidden text input when voice is selected
         ],
         outputs=[
             "text",  # Display the result text
@@ -115,7 +122,7 @@ def start_interface():
         live=True  # Allow live updating as the user interacts
     )
-    interface.launch()
 if __name__ == "__main__":
     start_interface()

 import gradio as gr
 # Function to convert speech to text using CMU Sphinx
+def voice_to_text_from_microphone(audio=None):
     recognizer = sr.Recognizer()
+    # If audio file is provided, use it. Otherwise, record from the microphone.
+    if audio:
+        # Using uploaded audio file
+        with sr.AudioFile(audio) as source:
+            audio_data = recognizer.record(source)
+    else:
+        # Using the default microphone as the audio source
+        with sr.Microphone() as source:
+            print("Please speak a math expression...")
+            recognizer.adjust_for_ambient_noise(source)
+            audio_data = recognizer.listen(source)
+    try:
+        # Using CMU Sphinx for offline recognition
+        text = recognizer.recognize_sphinx(audio_data)
+        print(f"Recognized text: {text}")
+        return text
+    except sr.UnknownValueError:
+        return "Sorry, I could not understand the audio."
+    except sr.RequestError:
+        return "Could not request results from Sphinx service."
 # Function to map speech to mathematical symbols
 def convert_speech_to_math(text):
         return f"Error: Unable to process the query. Please check the syntax. Error: {e}", None
 # Gradio interface function to handle the input
+def calculator(choice, text_input=None, audio=None):
     if choice == "voice":
+        # Convert speech to text using CMU Sphinx from the microphone or uploaded audio
+        query = voice_to_text_from_microphone(audio)
         if query.lower() == "sorry, i could not understand the audio.":
             return query, None
         fn=calculator,
         inputs=[
             gr.Radio(["voice", "text"], label="Choose Input Type"),  # Option to select between voice and text input
+            gr.Textbox(label="Or Type a Math Expression (Optional)", placeholder="Type your math expression here...", visible=False),  # Hidden text input when voice is selected
+            gr.Audio(label="Upload an Audio File (Optional)", type="filepath", visible=False)  # Option to upload an audio file
         ],
         outputs=[
             "text",  # Display the result text
         live=True  # Allow live updating as the user interacts
     )
+    interface.launch()(share=true)
 if __name__ == "__main__":
     start_interface()