ZoniaChatbot committed on
Commit
e9c5a00
verified
1 Parent(s): 793c82d

Update chatpdf.py

Browse files
Files changed (1) hide show
  1. chatpdf.py +7 -8
chatpdf.py CHANGED
@@ -421,14 +421,13 @@ class Rag:
421
  sim_contents = self.sim_model.most_similar(query, topn=self.similarity_top_k)
422
  # Get reference results from corpus
423
  hit_chunk_dict = dict()
424
- threshold_score = 0.5 # Establece un umbral para filtrar fragmentos irrelevantes
425
-
426
- for query_id, id_score_dict in sim_contents.items():
427
- for corpus_id, s in id_score_dict.items():
428
- if s > threshold_score: # Filtrar por puntuación de similitud
429
- hit_chunk = self.sim_model.corpus[corpus_id]
430
- reference_results.append(hit_chunk)
431
- hit_chunk_dict[corpus_id] = hit_chunk
432
 
433
  if reference_results:
434
  if self.rerank_model is not None:
 
421
  sim_contents = self.sim_model.most_similar(query, topn=self.similarity_top_k)
422
  # Get reference results from corpus
423
  hit_chunk_dict = dict()
424
+
425
+ for c in sim_contents:
426
+ for id_score_dict in c:
427
+ corpus_id = id_score_dict['corpus_id']
428
+ hit_chunk = id_score_dict["corpus_doc"]
429
+ reference_results.append(hit_chunk)
430
+ hit_chunk_dict[corpus_id] = hit_chunk
 
431
 
432
  if reference_results:
433
  if self.rerank_model is not None: