Spaces:
Sleeping
Sleeping
Update PDF_Reader.py
Browse files- PDF_Reader.py +2 -2
PDF_Reader.py
CHANGED
@@ -27,8 +27,8 @@ def replace_t_with_space(list_of_documents):
|
|
27 |
def read_pdf_text(pdf_path):
|
28 |
text = ""
|
29 |
pdf_reader = PdfReader(pdf_path)
|
30 |
-
|
31 |
-
|
32 |
|
33 |
text_splitter = RecursiveCharacterTextSplitter(chunk_size=10000, chunk_overlap=1000)
|
34 |
text_chunks = text_splitter.split_text(text)
|
|
|
27 |
def read_pdf_text(pdf_path):
|
28 |
text = ""
|
29 |
pdf_reader = PdfReader(pdf_path)
|
30 |
+
for page in pdf_reader.pages:
|
31 |
+
text += page.extract_text()
|
32 |
|
33 |
text_splitter = RecursiveCharacterTextSplitter(chunk_size=10000, chunk_overlap=1000)
|
34 |
text_chunks = text_splitter.split_text(text)
|