Spaces:

AI-Edify
/

Pronounciation_Assistant

Sleeping

App Files Community

AI-Edify committed on Sep 15, 2024

Commit

112a3e2

verified ·

1 Parent(s): b348d8d

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -32

app.py CHANGED Viewed

@@ -1,51 +1,31 @@
 import os
 import gradio as gr
 import openai
-from openai import OpenAI
 import speech_recognition as sr
-import threading
 import time
-# Initialize OpenAI client with API key from environment variable
-client = OpenAI(api_key=os.environ.get("OPENAI_API_KEY"))
-# Create an assistant
-assistant = client.beta.assistants.create(
-    name="Pronunciation Assistant",
-    instructions="You are a helpful pronunciation assistant. You compare the generated text with the user's transcription and then provide feedback on how the user can improve their pronunciation accordingly. You also single out specific words they pronounced incorrectly and give tips on how to improve like for example 'schedule' can be pronounced as 'sked-jool'.",
-    model="gpt-4-1106-preview"
-)
 def generate_text():
-    response = client.chat.completions.create(
         model="gpt-3.5-turbo",
         messages=[
             {"role": "system", "content": "Generate a short paragraph (2-3 sentences) for an English learner to read aloud."},
             {"role": "user", "content": "Create a practice text."}
         ]
     )
-    return response.choices[0].message.content
 def get_pronunciation_feedback(original_text, transcription):
-    thread = client.beta.threads.create()
-    message = client.beta.threads.messages.create(
-        thread_id=thread.id,
-        role="user",
-        content=f"Original text: '{original_text}'\nTranscription: '{transcription}'\nProvide pronunciation feedback."
-    )
-    run = client.beta.threads.runs.create(
-        thread_id=thread.id,
-        assistant_id=assistant.id
     )
-    while run.status != "completed":
-        time.sleep(1)
-        run = client.beta.threads.runs.retrieve(thread_id=thread.id, run_id=run.id)
-    messages = client.beta.threads.messages.list(thread_id=thread.id)
-    return messages.data[0].content[0].text.value
 def transcribe_audio_realtime(audio):
     recognizer = sr.Recognizer()
@@ -68,7 +48,7 @@ def practice_pronunciation(audio):
 demo = gr.Interface(
     fn=practice_pronunciation,
     inputs=[
-        gr.Audio(type="filepath")  # Removed 'source="microphone"'
     ],
     outputs=[
         gr.Textbox(label="Text to Read"),

 import os
 import gradio as gr
 import openai
 import speech_recognition as sr
 import time
+# Set OpenAI API key
+openai.api_key = os.environ.get("OPENAI_API_KEY")
 def generate_text():
+    response = openai.ChatCompletion.create(
         model="gpt-3.5-turbo",
         messages=[
             {"role": "system", "content": "Generate a short paragraph (2-3 sentences) for an English learner to read aloud."},
             {"role": "user", "content": "Create a practice text."}
         ]
     )
+    return response.choices[0].message['content']
 def get_pronunciation_feedback(original_text, transcription):
+    response = openai.ChatCompletion.create(
+        model="gpt-3.5-turbo",
+        messages=[
+            {"role": "system", "content": "You are a helpful pronunciation assistant. Compare the generated text with the user's transcription and provide feedback on how the user can improve their pronunciation. Single out specific words they pronounced incorrectly and give tips on how to improve, like for example 'schedule' can be pronounced as 'sked-jool'."},
+            {"role": "user", "content": f"Original text: '{original_text}'\nTranscription: '{transcription}'\nProvide pronunciation feedback."}
+        ]
     )
+    return response.choices[0].message['content']
 def transcribe_audio_realtime(audio):
     recognizer = sr.Recognizer()
 demo = gr.Interface(
     fn=practice_pronunciation,
     inputs=[
+        gr.Audio(type="filepath")
     ],
     outputs=[
         gr.Textbox(label="Text to Read"),