playground / app.py
xavierbarbier's picture
Create app.py
704093d verified
raw
history blame
737 Bytes
import gradio as gr
import numpy as np
from pypdf import PdfReader
import os
def extract_text(file):
    """Return the text of every page of an uploaded PDF as one string.

    Args:
        file: The value Gradio hands to the callback for the uploaded file.
            It is passed to ``PdfReader`` unchanged, so it must be something
            ``PdfReader`` can open (presumably a filesystem path -- confirm
            against the ``gr.File`` ``type`` setting of the installed Gradio
            version).

    Returns:
        The text extracted from each page, joined with single spaces.
        An empty string when ``file`` is ``None`` or empty.
    """
    # Nothing uploaded (or the upload was cleared): there is nothing to read.
    if not file:
        return ""

    reader = PdfReader(file)
    # A page with no extractable text contributes an empty string so that
    # the join never sees a non-string value.
    return " ".join(page.extract_text() or "" for page in reader.pages)
# Lay out the page: one file-upload widget and one text box.
with gr.Blocks() as demo:
    file_input = gr.File(label="Upload a PDF file")
    text_output = gr.Textbox(label="Extracted Text")

    # On upload, call extract_text with the file and put its return value
    # into the text box.
    file_input.upload(
        fn=extract_text,
        inputs=file_input,
        outputs=text_output,
    )

# Start serving the interface.
demo.launch()