File size: 737 Bytes
704093d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
import gradio as gr
import numpy as np
from pypdf import PdfReader
import os

def extract_text(file):
    """Return the text of every page of an uploaded PDF, joined by spaces.

    Args:
        file: The value delivered by the ``gr.File`` upload event.
            NOTE(review): depending on the Gradio version/``type`` setting
            this is presumably either a filesystem path or a temp-file
            object exposing its path as ``.name`` -- both are accepted.

    Returns:
        The concatenated page texts as a single string, or an empty string
        when no file was supplied.
    """
    if file is None:
        return ""

    # Accept both a plain path and a file wrapper carrying the path in `.name`.
    pdf_source = getattr(file, "name", file)
    reader = PdfReader(pdf_source)

    # `or ""` keeps the join safe if a page yields no text at all.
    return " ".join(page.extract_text() or "" for page in reader.pages)

# Build the UI: one upload widget feeding one text box.
with gr.Blocks() as demo:
    file_input = gr.File(label="Upload a PDF file")
    text_output = gr.Textbox(label="Extracted Text")

    # Run extract_text whenever a file finishes uploading and show its result.
    file_input.upload(
        fn=extract_text,
        inputs=file_input,
        outputs=text_output,
    )

# Start the Gradio server.
demo.launch()