Spaces:

pradeep4321
/

text2speech

Sleeping

App Files Community

pradeep4321 committed on May 19

Commit

1f6832e

verified ·

1 Parent(s): b90401c

Update src/app.py

Browse files

Files changed (1) hide show

src/app.py +44 -60

src/app.py CHANGED Viewed

@@ -1,80 +1,64 @@
 import os
 import tempfile
-import pyttsx3
 from docx import Document
 from PyPDF2 import PdfReader
 import streamlit as st
-import base64  # Add this import
 from io import BytesIO
-def text_to_speech(text, output_file):
-    engine = pyttsx3.init()
-    engine.setProperty('rate', 150)
-    voices = engine.getProperty('voices')
-    engine.setProperty('voice', voices[1].id)
-    engine.save_to_file(text, output_file)
-    engine.runAndWait()
 def convert_docx_to_text(docx_file):
     doc = Document(docx_file)
-    text = ""
-    for paragraph in doc.paragraphs:
-        text += paragraph.text + "\n"
-    return text
 def convert_pdf_to_text(pdf_file):
-    text = ""
-    pdf_reader = PdfReader(pdf_file)
-    for page in pdf_reader.pages:
-        text += page.extract_text()
-    return text
 def main():
-    st.title("Text to Speech Converter")
     uploaded_file = st.file_uploader("Upload a text, docx, or pdf file", type=["txt", "docx", "pdf"])
     if uploaded_file:
-        try:
-            # Save uploaded file content to a temporary file
-            temp_file = tempfile.NamedTemporaryFile(delete=False)
-            temp_file.write(uploaded_file.read())
-            temp_file.close()
-            file_extension = uploaded_file.name.split('.')[-1]
-            if file_extension.lower() == 'txt':
-                with open(temp_file.name, 'r', encoding='utf-8') as txt_file:
-                    text = txt_file.read()
-            elif file_extension.lower() == 'docx':
-                text = convert_docx_to_text(temp_file.name)
-            elif file_extension.lower() == 'pdf':
-                text = convert_pdf_to_text(temp_file.name)
-            else:
-                st.error("Unsupported file format")
-                return
-            with st.spinner("Converting text to speech..."):
-                output_audio_file = "output.mp3"
-                text_to_speech(text, output_audio_file)
-            st.audio(output_audio_file, format="audio/mp3", start_time=0)
-            # Provide a download link for the audio file
-            with open(output_audio_file, 'rb') as audio_file:
-                audio_bytes = audio_file.read()
-            st.markdown(get_binary_file_downloader_html(audio_bytes, output_audio_file), unsafe_allow_html=True)
-        except Exception as e:
-            st.error(f"An error occurred: {str(e)}")
-# Function to create a download link
-def get_binary_file_downloader_html(bin_file, file_label='File'):
-    with st.spinner("Preparing download link..."):
-        data = bin_file
-        b64 = base64.b64encode(data).decode()
-        href = f'<a href="data:application/octet-stream;base64,{b64}" download="{file_label}" target="_blank">Download {file_label}</a>'
-        return href
-if __name__ == '__main__':
     main()

 import os
+os.environ["STREAMLIT_CONFIG_DIR"] = "/tmp/.streamlit"
+os.makedirs("/tmp/.streamlit", exist_ok=True)
 import tempfile
+from gtts import gTTS
 from docx import Document
 from PyPDF2 import PdfReader
 import streamlit as st
+import base64
 from io import BytesIO
+def text_to_speech(text):
+    tts = gTTS(text)
+    audio_buffer = BytesIO()
+    tts.write_to_fp(audio_buffer)
+    audio_buffer.seek(0)
+    return audio_buffer
 def convert_docx_to_text(docx_file):
     doc = Document(docx_file)
+    return "\n".join([p.text for p in doc.paragraphs])
 def convert_pdf_to_text(pdf_file):
+    reader = PdfReader(pdf_file)
+    return "\n".join([page.extract_text() or '' for page in reader.pages])
+def get_download_link(audio_data, filename="output.mp3"):
+    b64 = base64.b64encode(audio_data).decode()
+    href = f'<a href="data:audio/mp3;base64,{b64}" download="{filename}">Download {filename}</a>'
+    return href
 def main():
+    st.title("Text to Speech Converter (No File Write)")
     uploaded_file = st.file_uploader("Upload a text, docx, or pdf file", type=["txt", "docx", "pdf"])
     if uploaded_file:
+        ext = uploaded_file.name.split('.')[-1].lower()
+        text = ""
+        if ext == 'txt':
+            text = uploaded_file.read().decode("utf-8")
+        elif ext == 'docx':
+            text = convert_docx_to_text(uploaded_file)
+        elif ext == 'pdf':
+            text = convert_pdf_to_text(uploaded_file)
+        else:
+            st.error("Unsupported file format")
+            return
+        if not text.strip():
+            st.warning("No readable text found.")
+            return
+        with st.spinner("Converting to speech..."):
+            audio_buffer = text_to_speech(text)
+            audio_bytes = audio_buffer.read()
+        st.audio(audio_bytes, format="audio/mp3")
+        st.markdown(get_download_link(audio_bytes), unsafe_allow_html=True)
+if __name__ == "__main__":
     main()