aminaj committed on
Commit
e3cf4fe
·
verified ·
1 Parent(s): 399cab8

Update backend/pdf_ingestion.py

Browse files
Files changed (1) hide show
  1. backend/pdf_ingestion.py +2 -2
backend/pdf_ingestion.py CHANGED
@@ -9,8 +9,8 @@ def load_split_pdf(file_path):
9
 
10
  # Initialize the recursive character text splitter
11
  text_splitter = RecursiveCharacterTextSplitter(
12
- chunk_size=500, # Set the maximum chunk size
13
- chunk_overlap=50, # Set the number of overlapping characters between chunks
14
  separators=["\n\n", "\n", " ", ""], # Define resume-specific separators for splitting
15
  )
16
 
 
9
 
10
  # Initialize the recursive character text splitter
11
  text_splitter = RecursiveCharacterTextSplitter(
12
+ chunk_size=100, # Set the maximum chunk size
13
+ chunk_overlap=20, # Set the number of overlapping characters between chunks
14
  separators=["\n\n", "\n", " ", ""], # Define resume-specific separators for splitting
15
  )
16