asimmetti committed on
Commit
4f56247
·
verified ·
1 Parent(s): cbcf4e9
Files changed (1) hide show
  1. app.py +10 -8
app.py CHANGED
@@ -307,14 +307,16 @@ demo: Optional[gr.Interface] = None # Assign your gradio demo to this variable
307
  return_type = List[Hit]
308
 
309
  ## YOUR_CODE_STARTS_HERE
 
310
  bm25_index = BM25Index.build_from_documents(
311
- documents=iter(sciq.corpus),
312
- ndocs=len(sciq.corpus),
313
- k1=0.9,
314
- b=0.4
315
- )
316
- bm25_index.save("output/bm25_index_b") # Save index to directory
317
- bm25_retriever = BM25Retriever(index_dir="output/bm25_index_b")
 
318
 
319
  corpus_dict = {doc.collection_id: doc.text for doc in sciq.corpus}
320
 
@@ -339,4 +341,4 @@ demo = gr.Interface(
339
  title="BM25 Query Engine"
340
  )
341
  ## YOUR_CODE_ENDS_HERE
342
- demo.launch()
 
307
  return_type = List[Hit]
308
 
309
  ## YOUR_CODE_STARTS_HERE
310
+ # Building BM25 index and save:
311
  bm25_index = BM25Index.build_from_documents(
312
+ documents=iter(sciq.corpus),
313
+ ndocs=12160,
314
+ show_progress_bar=True
315
+ )
316
+ bm25_index.save("output/bm25_index")
317
+
318
+ # Loading index and use BM25 retriever to retrieve:
319
+ bm25_retriever = BM25Retriever(index_dir="output/bm25_index")
320
 
321
  corpus_dict = {doc.collection_id: doc.text for doc in sciq.corpus}
322
 
 
341
  title="BM25 Query Engine"
342
  )
343
  ## YOUR_CODE_ENDS_HERE
344
+ demo.launch()