zhenyundeng committed on
Commit
0c31614
·
1 Parent(s): 99c6d37

update files

Browse files
Files changed (1) hide show
  1. app.py +20 -5
app.py CHANGED
@@ -589,13 +589,13 @@ def get_text_from_link(url_link):
589
 
590
  def get_google_search_results(api_key, search_engine_id, google_search, sort_date, search_string, page=0):
591
  search_results = []
592
- for i in range(3):
593
  try:
594
  search_results += google_search(
595
  search_string,
596
  api_key,
597
  search_engine_id,
598
- num=10,
599
  start=0 + 10 * page,
600
  sort="date:r:19000101:" + sort_date,
601
  dateRestrict=None,
@@ -603,7 +603,23 @@ def get_google_search_results(api_key, search_engine_id, google_search, sort_dat
603
  )
604
  break
605
  except:
606
- sleep(3)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
607
 
608
  return search_results
609
 
@@ -750,7 +766,6 @@ def averitec_search(claim, generate_question, speaker="they", check_date="2024-0
750
  for page_num in range(n_pages):
751
  search_results = get_google_search_results(api_key, search_engine_id, google_search, sort_date,
752
  this_search_string, page=page_num)
753
- search_results = search_results[:5]
754
 
755
  for result in search_results:
756
  link = str(result["link"])
@@ -829,7 +844,7 @@ def generate_step2_reference_corpus(reference_file):
829
  return tokenized_corpus, prompt_corpus
830
 
831
 
832
- def decorate_with_questions(claim, retrieve_evidence, top_k=10): # top_k=100
833
  #
834
  reference_file = "averitec/data/train.json"
835
  tokenized_corpus, prompt_corpus = generate_step2_reference_corpus(reference_file)
 
589
 
590
  def get_google_search_results(api_key, search_engine_id, google_search, sort_date, search_string, page=0):
591
  search_results = []
592
+ for i in range(1):
593
  try:
594
  search_results += google_search(
595
  search_string,
596
  api_key,
597
  search_engine_id,
598
+ num=3, # num=10,
599
  start=0 + 10 * page,
600
  sort="date:r:19000101:" + sort_date,
601
  dateRestrict=None,
 
603
  )
604
  break
605
  except:
606
+ sleep(1)
607
+
608
+ # for i in range(3):
609
+ # try:
610
+ # search_results += google_search(
611
+ # search_string,
612
+ # api_key,
613
+ # search_engine_id,
614
+ # num=10,
615
+ # start=0 + 10 * page,
616
+ # sort="date:r:19000101:" + sort_date,
617
+ # dateRestrict=None,
618
+ # gl="US"
619
+ # )
620
+ # break
621
+ # except:
622
+ # sleep(3)
623
 
624
  return search_results
625
 
 
766
  for page_num in range(n_pages):
767
  search_results = get_google_search_results(api_key, search_engine_id, google_search, sort_date,
768
  this_search_string, page=page_num)
 
769
 
770
  for result in search_results:
771
  link = str(result["link"])
 
844
  return tokenized_corpus, prompt_corpus
845
 
846
 
847
+ def decorate_with_questions(claim, retrieve_evidence, top_k=5): # top_k=10, 100
848
  #
849
  reference_file = "averitec/data/train.json"
850
  tokenized_corpus, prompt_corpus = generate_step2_reference_corpus(reference_file)