Namitg02 committed on
Commit
f7d0c53
·
verified ·
1 Parent(s): 7cf2ad5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -5,7 +5,7 @@ dataset = load_dataset("Namitg02/Test")
5
 
6
 
7
  from langchain.text_splitter import RecursiveCharacterTextSplitter
8
- splitter = RecursiveCharacterTextSplitter(chunk_size=512, chunk_overlap=30)
9
  docs = splitter.split_text(dataset)
10
 
11
 
 
5
 
6
 
7
  from langchain.text_splitter import RecursiveCharacterTextSplitter
8
+ splitter = RecursiveCharacterTextSplitter(chunk_size=100, chunk_overlap=15,separators=["\n\n", "\n", "\. ", " ", ""])
9
  docs = splitter.split_text(dataset)
10
 
11