Spaces:
Runtime error
Runtime error
import streamlit as st | |
from gtts import gTTS | |
from io import BytesIO | |
import torch | |
import torchaudio | |
from PyPDF2 import PdfReader | |
from whisperspeech.pipeline import Pipeline | |
st.image('OIG3 (4).jpeg', caption='Your host on this PDF-to-Speech adventure!') | |
st.write("β³ Loading WhisperSpeech Pipeline β") | |
pipe = Pipeline(torch_compile=True) | |
# TTS pipeline | |
x = st.slider('Select the number of pages you wish to transcribe') | |
uploaded_file = st.file_uploader("Choose a file", "pdf") | |
if uploaded_file is not None: | |
# creating a pdf reader object | |
reader = PdfReader(uploaded_file) | |
# printing number of pages in pdf file | |
X = len(reader.pages) | |
print(X) | |
i = 0 | |
while i <= X and i <= x: | |
# getting a specific page from the pdf file | |
page = reader.pages[i] | |
# extracting text from page | |
text = page.extract_text() | |
print("Created text of page", i ) | |
# Generate audio for the current page using a unique filename | |
page_audio_file = f"output_{i}.wav" | |
pipe.generate_to_file(page_audio_file, text) | |
# Display the generated audio using st.audio | |
with open(page_audio_file, "rb") as audio_file: | |
st.audio(audio_file) | |
# sound_file = BytesIO() | |
# tts = gTTS(text, lang='en') | |
# tts.write_to_fp(sound_file) | |
# st.audio(sound_file) | |
print("Read aloud", i, "pages of", X, "total pages.") | |
i = i + 1 | |
st.write("π That's the whole PDF! Have an awesome day! π") | |
prompt = st.chat_input("Copy/Paste or type in text to have read aloud") | |
if prompt: | |
st.write(prompt) | |
with st.popover("β¨ Open your text-to-speech from text input β¨"): | |
#sound_file = BytesIO() | |
#tts = gTTS(prompt, lang='en') | |
#tts.write_to_fp(sound_file) | |
#st.audio(sound_file) | |
# Generate audio for the current page using a unique filename | |
page_audio_file = f"output_{i}.wav" | |
pipe.generate_to_file(page_audio_file, text) | |
# Display the generated audio using st.audio | |
with open(page_audio_file, "rb") as audio_file: | |
st.audio(audio_file) | |