dobinyim committed on
Commit
3cc356b
·
verified ·
1 Parent(s): 7da07a5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -17
app.py CHANGED
@@ -49,31 +49,23 @@ hf_embeddings = HuggingFaceEndpointEmbeddings(
49
  huggingfacehub_api_token=HF_TOKEN,
50
  )
51
 
52
- vectorstore_path = "./data/vectorstore"
53
- index_file = os.path.join(vectorstore_path, "index.faiss")
54
-
55
- if os.path.exists(index_file):
56
  vectorstore = FAISS.load_local(
57
- vectorstore_path,
58
  hf_embeddings,
59
- allow_dangerous_deserialization=True
60
  )
61
  hf_retriever = vectorstore.as_retriever()
62
  print("Loaded Vectorstore")
63
  else:
64
  print("Indexing Files")
65
- os.makedirs(vectorstore_path, exist_ok=True)
66
- ### 4. INDEX FILES
67
- vectorstore = None
68
  for i in range(0, len(split_documents), 32):
69
- batch = split_documents[i:i+32]
70
- if vectorstore is None:
71
- vectorstore = FAISS.from_documents(batch, hf_embeddings)
72
- else:
73
- vectorstore.add_documents(batch)
74
- vectorstore.save_local(vectorstore_path)
75
- print("Vectorstore created and saved")
76
-
77
 
78
  hf_retriever = vectorstore.as_retriever()
79
 
 
49
  huggingfacehub_api_token=HF_TOKEN,
50
  )
51
 
52
+ if os.path.exists("./data/vectorstore"):
 
 
 
53
  vectorstore = FAISS.load_local(
54
+ "./data/vectorstore",
55
  hf_embeddings,
56
+ allow_dangerous_deserialization=True # this is necessary to load the vectorstore from disk as it's stored as a `.pkl` file.
57
  )
58
  hf_retriever = vectorstore.as_retriever()
59
  print("Loaded Vectorstore")
60
  else:
61
  print("Indexing Files")
62
+ os.makedirs("./data/vectorstore", exist_ok=True)
 
 
63
  for i in range(0, len(split_documents), 32):
64
+ if i == 0:
65
+ vectorstore = FAISS.from_documents(split_documents[i:i+32], hf_embeddings)
66
+ continue
67
+ vectorstore.add_documents(split_documents[i:i+32])
68
+ vectorstore.save_local("./data/vectorstore")
 
 
 
69
 
70
  hf_retriever = vectorstore.as_retriever()
71