Update app.py
app.py CHANGED
@@ -6,6 +6,7 @@ from gtts import gTTS
 import tempfile
 import shutil
 import re
+import speech_recognition as sr  # Library for voice recognition

 def translate_to_japanese(api_key, text):
     """
@@ -29,7 +30,7 @@ def translate_to_japanese(api_key, text):
     try:
         # Call the OpenAI API to get the Japanese translation
         response_translation = openai.ChatCompletion.create(
-            model="gpt-
+            model="gpt-4",  # Ensure using the correct endpoint for the GPT model
             messages=messages_translation,
             max_tokens=300,
             temperature=0.5
@@ -46,7 +47,7 @@ def translate_to_japanese(api_key, text):

         # Call the OpenAI API to get the pronunciation
         response_pronunciation = openai.ChatCompletion.create(
-            model="gpt-
+            model="gpt-4",
             messages=messages_pronunciation,
             max_tokens=300,
             temperature=0.5
@@ -76,12 +77,32 @@ def generate_audio_from_text(text):
     tts.save(temp_audio_file.name)
     return temp_audio_file.name

+# Function to capture and transcribe voice input
+def transcribe_voice_input():
+    recognizer = sr.Recognizer()
+    with sr.Microphone() as source:
+        st.info("Please speak now...")
+        recognizer.adjust_for_ambient_noise(source)
+        audio = recognizer.listen(source)
+    try:
+        # Use Google Web Speech API to transcribe audio
+        text = recognizer.recognize_google(audio)
+        st.success(f"Transcribed text: {text}")
+        return text
+    except sr.UnknownValueError:
+        st.error("Sorry, I could not understand the audio. Please try again.")
+        return None
+    except sr.RequestError:
+        st.error("Could not request results from Google Speech Recognition service.")
+        return None
+
 # Streamlit UI
 st.title("English to Japanese Translator with Pronunciation")
-st.markdown("Translate English text into Japanese and get its pronunciation (Romaji)
+st.markdown("Translate English text into Japanese and get its pronunciation (Romaji). You can input text or use voice.")

+# Display an image if you have one
 translateimg = Image.open("Untitled.png")  # Ensure the file is in the correct directory
-st.image(translateimg, use_container_width=True)
+st.image(translateimg, use_container_width=True)

 # Access the API key from Hugging Face Secrets
 api_key = os.getenv("OPENAI_API_KEY")
@@ -89,19 +110,17 @@ api_key = os.getenv("OPENAI_API_KEY")
 # Input field for the text
 english_text = st.text_area("Enter the English text to translate")

-# Button to trigger the translation
-if st.button("Translate"):
+# Button to trigger the translation from text input
+if st.button("Translate from Text"):
     if api_key and english_text:
         japanese_text, pronunciation = translate_to_japanese(api_key, english_text)
         if pronunciation:
-            # Clean pronunciation (remove unnecessary parts)
             cleaned_pronunciation = clean_pronunciation(pronunciation)
-
             st.markdown("### Translation Result:")
             st.write(f"**English Text:** {english_text}")
             st.write(f"**Japanese Output:** {japanese_text}")
             st.write(f"**Pronunciation:** {cleaned_pronunciation}")
-
+
             # Save the result in a text file
             result_text = f"English Text: {english_text}\n\nJapanese Translation: {japanese_text}\nPronunciation: {cleaned_pronunciation}"

@@ -120,12 +139,7 @@ if st.button("Translate"):

             # Generate audio for pronunciation
             audio_file_path = generate_audio_from_text(cleaned_pronunciation)
-
-            # Provide a button to play the pronunciation audio
             st.audio(audio_file_path, format="audio/mp3")
-
-            translateimg2 = Image.open("v3.png")  # Ensure the file is in the correct directory
-            st.image(translateimg2, width=150)  # Adjust the size as per preference
         else:
             st.error(japanese_text)  # Display error message if API call fails
     else:
@@ -133,3 +147,26 @@ if st.button("Translate"):
             st.error("API key is missing. Please add it as a secret in Hugging Face Settings.")
         else:
             st.error("Please provide text to translate.")
+
+# Button to trigger translation from voice input
+if st.button("Translate from Voice"):
+    if api_key:
+        voice_input = transcribe_voice_input()
+        if voice_input:
+            japanese_text, pronunciation = translate_to_japanese(api_key, voice_input)
+            if pronunciation:
+                cleaned_pronunciation = clean_pronunciation(pronunciation)
+                st.markdown("### Translation Result from Voice:")
+                st.write(f"**English Text (from Voice):** {voice_input}")
+                st.write(f"**Japanese Output:** {japanese_text}")
+                st.write(f"**Pronunciation:** {cleaned_pronunciation}")
+
+                # Generate audio for pronunciation
+                audio_file_path = generate_audio_from_text(cleaned_pronunciation)
+                st.audio(audio_file_path, format="audio/mp3")
+            else:
+                st.error(japanese_text)  # Display error message if API call fails
+        else:
+            st.error("Could not transcribe voice input.")
+    else:
+        st.error("API key is missing. Please add it as a secret in Hugging Face Settings.")