Samarth991 committed on
Commit
73bf17a
·
verified ·
1 Parent(s): 91be402

Update PDF_Reader.py

Browse files
Files changed (1) hide show
  1. PDF_Reader.py +2 -2
PDF_Reader.py CHANGED
@@ -27,8 +27,8 @@ def replace_t_with_space(list_of_documents):
27
  def read_pdf_text(pdf_path):
28
  text = ""
29
  pdf_reader = PdfReader(pdf_path)
30
- for page in pdf_reader.pages:
31
- text += page.extract_text()
32
 
33
  text_splitter = RecursiveCharacterTextSplitter(chunk_size=10000, chunk_overlap=1000)
34
  text_chunks = text_splitter.split_text(text)
 
27
  def read_pdf_text(pdf_path):
28
  text = ""
29
  pdf_reader = PdfReader(pdf_path)
30
+ for page in pdf_reader.pages:
31
+ text += page.extract_text()
32
 
33
  text_splitter = RecursiveCharacterTextSplitter(chunk_size=10000, chunk_overlap=1000)
34
  text_chunks = text_splitter.split_text(text)