Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -69,33 +69,35 @@ def preprocess_text(text):
|
|
69 |
sentences = sent_tokenize(text)
|
70 |
return sentences
|
71 |
|
72 |
-
def upload_files(
|
73 |
global faiss_index
|
74 |
try:
|
75 |
-
|
76 |
-
|
77 |
-
|
78 |
-
|
79 |
-
|
80 |
-
|
81 |
-
|
82 |
-
|
83 |
-
|
84 |
-
|
85 |
-
|
86 |
-
|
87 |
-
|
88 |
-
|
|
|
89 |
|
90 |
# Save the updated index
|
91 |
with open(index_path, "wb") as f:
|
92 |
pickle.dump(faiss_index, f)
|
93 |
|
94 |
-
return {"message": "
|
95 |
except Exception as e:
|
96 |
-
print(f"Error processing
|
97 |
return {"error": str(e)} # Provide informative error message
|
98 |
|
|
|
99 |
def process_and_query(state, question):
|
100 |
if question:
|
101 |
# Preprocess the question
|
|
|
69 |
sentences = sent_tokenize(text)
|
70 |
return sentences
|
71 |
|
72 |
+
def upload_files(files):
    """Index the sentences of uploaded PDF/DOCX files and persist the index.

    Args:
        files: Iterable of uploaded file objects. Each must expose a ``name``
            attribute (used to pick the extractor by extension) and a
            ``read()`` method whose result is handed to the extractor.

    Returns:
        ``{"message": "Files processed successfully"}`` on success, or
        ``{"error": <text>}`` if any file has an unsupported extension or an
        exception is raised while processing.
    """
    global faiss_index
    try:
        # Validate every file before touching the index, so an unsupported
        # file late in the list cannot leave earlier files added in memory
        # while the on-disk index is never updated.
        accepted = []
        for file in files:
            lowered_name = file.name.lower()  # accept ".PDF" / ".DOCX" too
            if lowered_name.endswith('.pdf'):
                accepted.append((file, 'pdf'))
            elif lowered_name.endswith('.docx'):
                accepted.append((file, 'docx'))
            else:
                return {"error": "Unsupported file format"}

        for file, kind in accepted:
            if kind == 'pdf':
                text = extract_text_from_pdf(file.read())
            else:
                text = extract_text_from_docx(file.read())

            # Preprocess text
            sentences = preprocess_text(text)
            if not sentences:
                # Nothing to embed for this document.
                continue

            # Encode sentences and add them to the FAISS index in one batch.
            # NOTE(review): assumes encode() returns one row per sentence
            # (n_sentences, dim) -- confirm against the embedding model used.
            embeddings = embedding_model.encode(sentences)
            faiss_index.add(np.asarray(embeddings, dtype=np.float32))

        # Save the updated index
        # NOTE(review): the index is persisted with pickle; only load this
        # file from a trusted location.
        with open(index_path, "wb") as f:
            pickle.dump(faiss_index, f)

        return {"message": "Files processed successfully"}
    except Exception as e:
        print(f"Error processing files: {e}")
        return {"error": str(e)}  # Provide informative error message
|
99 |
|
100 |
+
|
101 |
def process_and_query(state, question):
|
102 |
if question:
|
103 |
# Preprocess the question
|