demoPOC committed on
Commit
288a785
·
1 Parent(s): 02a16b9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -2
app.py CHANGED
@@ -132,8 +132,15 @@ def loadKB(fileprovided, urlProvided, uploads_dir, request):
132
  for file in request.files.getlist('files[]'):
133
  print("File Received>>>" + file.filename)
134
  file.save(os.path.join(uploads_dir, secure_filename(file.filename)))
135
- loader = PyPDFLoader(os.path.join(uploads_dir, secure_filename(file.filename)))
136
- documents.extend(loader.load())
 
 
 
 
 
 
 
137
  else:
138
  loader = TextLoader('Jio.txt')
139
  documents.extend(loader.load())
 
132
  for file in request.files.getlist('files[]'):
133
  print("File Received>>>" + file.filename)
134
  file.save(os.path.join(uploads_dir, secure_filename(file.filename)))
135
+ #loader = PyPDFLoader(os.path.join(uploads_dir, secure_filename(file.filename)))
136
+ #documents.extend(loader.load())
137
+ BASE_MODEL = "LLAMA-TOKENIZER"
138
+ savedModelPath = "./model/" + BASE_MODEL
139
+ global tokenizer
140
+ #tokenizer = LlamaTokenizer.from_pretrained(savedModelPath)
141
+ tokenizer = AutoTokenizer.from_pretrained("bert-base-cased")
142
+ separator = "</Q>"
143
+ documents.extend(PDFChunkerWithSeparator(os.path.join(uploads_dir, secure_filename(file.filename)),separator))
144
  else:
145
  loader = TextLoader('Jio.txt')
146
  documents.extend(loader.load())