Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -9,6 +9,7 @@ from pydantic import BaseModel, Field
|
|
9 |
from tempfile import NamedTemporaryFile
|
10 |
from langchain_community.vectorstores import FAISS
|
11 |
from langchain_core.vectorstores import VectorStore
|
|
|
12 |
from langchain_community.document_loaders import PyPDFLoader
|
13 |
from langchain_community.embeddings import HuggingFaceEmbeddings
|
14 |
from llama_parse import LlamaParse
|
@@ -462,7 +463,10 @@ def get_response_from_pdf(query, model, selected_docs, num_calls=3, temperature=
|
|
462 |
return
|
463 |
|
464 |
# Pre-filter the documents
|
465 |
-
filtered_docs = [
|
|
|
|
|
|
|
466 |
|
467 |
logging.info(f"Number of documents after pre-filtering: {len(filtered_docs)}")
|
468 |
|
|
|
9 |
from tempfile import NamedTemporaryFile
|
10 |
from langchain_community.vectorstores import FAISS
|
11 |
from langchain_core.vectorstores import VectorStore
|
12 |
+
from langchain_core.documents import Document
|
13 |
from langchain_community.document_loaders import PyPDFLoader
|
14 |
from langchain_community.embeddings import HuggingFaceEmbeddings
|
15 |
from llama_parse import LlamaParse
|
|
|
463 |
return
|
464 |
|
465 |
# Pre-filter the documents
|
466 |
+
filtered_docs = []
|
467 |
+
for doc_id, doc in database.docstore._dict.items():
|
468 |
+
if isinstance(doc, Document) and doc.metadata.get("source") in selected_docs:
|
469 |
+
filtered_docs.append(doc)
|
470 |
|
471 |
logging.info(f"Number of documents after pre-filtering: {len(filtered_docs)}")
|
472 |
|