Spaces:
Runtime error
Runtime error
Commit
·
69f292c
1
Parent(s):
9d4b1c5
Update app.py
Browse files
app.py
CHANGED
@@ -200,29 +200,34 @@ if len(ALL_FILES) > 0:
|
|
200 |
# we will use batches of 64
|
201 |
batch_size = 128
|
202 |
# docs = docs['documents']
|
203 |
-
with st.spinner(
|
204 |
-
|
205 |
-
|
206 |
-
|
207 |
-
|
208 |
-
|
209 |
-
|
210 |
-
|
211 |
-
|
212 |
-
|
213 |
-
|
214 |
-
|
215 |
-
|
216 |
-
|
217 |
-
|
218 |
-
|
219 |
-
|
220 |
-
|
221 |
-
|
222 |
-
|
223 |
-
|
224 |
-
|
225 |
-
|
|
|
|
|
|
|
|
|
|
|
226 |
|
227 |
top_k_reader = st.sidebar.slider(
|
228 |
"Max. number of answers",
|
|
|
200 |
# we will use batches of 64
|
201 |
batch_size = 128
|
202 |
# docs = docs['documents']
|
203 |
+
# with st.spinner(
|
204 |
+
# "🧠 Performing indexing of uplaoded documents... \n "
|
205 |
+
# ):
|
206 |
+
my_bar = st.progress(0)
|
207 |
+
upload_count = 0
|
208 |
+
for i in range(0, len(docs), batch_size):
|
209 |
+
# find end of batch
|
210 |
+
i_end = min(i+batch_size, len(docs))
|
211 |
+
# extract batch
|
212 |
+
batch = [doc.content for doc in docs[i:i_end]]
|
213 |
+
# generate embeddings for batch
|
214 |
+
emb = sentence_encoder.encode(batch).tolist()
|
215 |
+
# get metadata
|
216 |
+
# meta = [doc.meta for doc in docs[i:i_end]]
|
217 |
+
meta = []
|
218 |
+
for doc in docs[i:i_end]:
|
219 |
+
meta_dict = doc.meta
|
220 |
+
meta_dict["text"] = doc.content
|
221 |
+
meta.append(meta_dict)
|
222 |
+
# create unique IDs
|
223 |
+
ids = [doc.id for doc in docs[i:i_end]]
|
224 |
+
# add all to upsert list
|
225 |
+
to_upsert = list(zip(ids, emb, meta))
|
226 |
+
# upsert/insert these records to pinecone
|
227 |
+
_ = index.upsert(vectors=to_upsert)
|
228 |
+
upload_count+=batch_size
|
229 |
+
upload_percentage = int((upload_count/len(docs))*100)
|
230 |
+
my_bar.progress(percent_complete + upload_percentage)
|
231 |
|
232 |
top_k_reader = st.sidebar.slider(
|
233 |
"Max. number of answers",
|