|
import gradio as gr |
|
from langchain.document_loaders import PDFMinerLoader, PyMuPDFLoader |
|
from langchain.text_splitter import CharacterTextSplitter |
|
|
|
|
|
|
|
import gradio as gr |
|
|
|
def upload_pdf(file):
    """Return the first text chunk extracted from an uploaded PDF.

    Args:
        file: The upload handed over by the Gradio ``"file"`` input: either
            an object exposing the on-disk path as ``.name`` or the path
            itself as a string. ``None`` when nothing was uploaded.

    Returns:
        The ``page_content`` of the first chunk produced by the splitter
        (configured with ``chunk_size=1000`` and ``chunk_overlap=0``), or an
        empty string when no file was supplied or no chunk was produced.
    """
    if file is None:
        return ""

    # Hand the loader the full path. The original reduced it to a basename
    # (through an undefined ``file_path`` variable), which could only be
    # resolved if the upload happened to live in the working directory.
    pdf_path = file if isinstance(file, str) else file.name

    documents = PDFMinerLoader(pdf_path).load()

    text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
    chunks = text_splitter.split_documents(documents)

    # A PDF without extractable text yields no chunks; avoid IndexError.
    return chunks[0].page_content if chunks else ""
|
|
|
# Single-input UI: one uploaded file in, extracted text out.
iface = gr.Interface(
    fn=upload_pdf,
    inputs="file",
    outputs="text",
    title="PDF File Uploader",
    # The handler returns extracted text, not the file's name.
    description="Upload a PDF file and get its first chunk of extracted text.",
)

# Start the server only when executed as a script, so importing this module
# does not launch a web server as a side effect.
if __name__ == "__main__":
    iface.launch()
|
|
|
|