Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -125,6 +125,11 @@ def PDFChunkerWithSeparator(filepath, separator):
|
|
125 |
|
126 |
def loadKB(fileprovided, urlProvided, uploads_dir, request):
|
127 |
documents = []
|
|
|
|
|
|
|
|
|
|
|
128 |
if fileprovided:
|
129 |
# Delete Files
|
130 |
clearKBUploadDirectory(uploads_dir)
|
@@ -134,11 +139,8 @@ def loadKB(fileprovided, urlProvided, uploads_dir, request):
|
|
134 |
file.save(os.path.join(uploads_dir, secure_filename(file.filename)))
|
135 |
#loader = PyPDFLoader(os.path.join(uploads_dir, secure_filename(file.filename)))
|
136 |
#documents.extend(loader.load())
|
137 |
-
|
138 |
-
|
139 |
-
global tokenizer
|
140 |
-
#tokenizer = LlamaTokenizer.from_pretrained(savedModelPath)
|
141 |
-
tokenizer = AutoTokenizer.from_pretrained("bert-base-cased")
|
142 |
separator = "</Q>"
|
143 |
documents.extend(PDFChunkerWithSeparator(os.path.join(uploads_dir, secure_filename(file.filename)),separator))
|
144 |
else:
|
|
|
125 |
|
126 |
def loadKB(fileprovided, urlProvided, uploads_dir, request):
|
127 |
documents = []
|
128 |
+
global tokenizer
|
129 |
+
BASE_MODEL = "LLAMA-TOKENIZER"
|
130 |
+
savedModelPath = "./model/" + BASE_MODEL
|
131 |
+
#tokenizer = LlamaTokenizer.from_pretrained(savedModelPath)
|
132 |
+
tokenizer = AutoTokenizer.from_pretrained("bert-base-cased")
|
133 |
if fileprovided:
|
134 |
# Delete Files
|
135 |
clearKBUploadDirectory(uploads_dir)
|
|
|
139 |
file.save(os.path.join(uploads_dir, secure_filename(file.filename)))
|
140 |
#loader = PyPDFLoader(os.path.join(uploads_dir, secure_filename(file.filename)))
|
141 |
#documents.extend(loader.load())
|
142 |
+
|
143 |
+
|
|
|
|
|
|
|
144 |
separator = "</Q>"
|
145 |
documents.extend(PDFChunkerWithSeparator(os.path.join(uploads_dir, secure_filename(file.filename)),separator))
|
146 |
else:
|