Spaces:
Running
Running
Update backend/pdf_ingestion.py
Browse files- backend/pdf_ingestion.py +2 -2
backend/pdf_ingestion.py
CHANGED
@@ -9,8 +9,8 @@ def load_split_pdf(file_path):
 
     # Initialize the recursive character text splitter
     text_splitter = RecursiveCharacterTextSplitter(
-        chunk_size=
-        chunk_overlap=
+        chunk_size=100, # Set the maximum chunk size
+        chunk_overlap=20, # Set the number of overlapping characters between chunks
         separators=["\n\n", "\n", " ", ""], # Define resume-specific separators for splitting
     )
 