Spaces:
Sleeping
Sleeping
update
Browse files
app.py
CHANGED
@@ -307,14 +307,16 @@ demo: Optional[gr.Interface] = None # Assign your gradio demo to this variable
|
|
307 |
return_type = List[Hit]
|
308 |
|
309 |
## YOUR_CODE_STARTS_HERE
|
|
|
310 |
bm25_index = BM25Index.build_from_documents(
|
311 |
-
|
312 |
-
|
313 |
-
|
314 |
-
|
315 |
-
|
316 |
-
|
317 |
-
|
|
|
318 |
|
319 |
corpus_dict = {doc.collection_id: doc.text for doc in sciq.corpus}
|
320 |
|
@@ -339,4 +341,4 @@ demo = gr.Interface(
|
|
339 |
title="BM25 Query Engine"
|
340 |
)
|
341 |
## YOUR_CODE_ENDS_HERE
|
342 |
-
demo.launch()
|
|
|
307 |
return_type = List[Hit]
|
308 |
|
309 |
## YOUR_CODE_STARTS_HERE
|
310 |
+
# Building BM25 index and save:
|
311 |
bm25_index = BM25Index.build_from_documents(
|
312 |
+
documents=iter(sciq.corpus),
|
313 |
+
ndocs=12160,
|
314 |
+
show_progress_bar=True
|
315 |
+
)
|
316 |
+
bm25_index.save("output/bm25_index")
|
317 |
+
|
318 |
+
# Loading index and use BM25 retriever to retrieve:
|
319 |
+
bm25_retriever = BM25Retriever(index_dir="output/bm25_index")
|
320 |
|
321 |
corpus_dict = {doc.collection_id: doc.text for doc in sciq.corpus}
|
322 |
|
|
|
341 |
title="BM25 Query Engine"
|
342 |
)
|
343 |
## YOUR_CODE_ENDS_HERE
|
344 |
+
demo.launch()
|