Spaces:
Build error
Build error
zhenyundeng
committed on
Commit
·
0c31614
1
Parent(s):
99c6d37
update files
Browse files
app.py
CHANGED
@@ -589,13 +589,13 @@ def get_text_from_link(url_link):
|
|
589 |
|
590 |
def get_google_search_results(api_key, search_engine_id, google_search, sort_date, search_string, page=0):
|
591 |
search_results = []
|
592 |
-
for i in range(
|
593 |
try:
|
594 |
search_results += google_search(
|
595 |
search_string,
|
596 |
api_key,
|
597 |
search_engine_id,
|
598 |
-
num=10,
|
599 |
start=0 + 10 * page,
|
600 |
sort="date:r:19000101:" + sort_date,
|
601 |
dateRestrict=None,
|
@@ -603,7 +603,23 @@ def get_google_search_results(api_key, search_engine_id, google_search, sort_dat
|
|
603 |
)
|
604 |
break
|
605 |
except:
|
606 |
-
sleep(
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
607 |
|
608 |
return search_results
|
609 |
|
@@ -750,7 +766,6 @@ def averitec_search(claim, generate_question, speaker="they", check_date="2024-0
|
|
750 |
for page_num in range(n_pages):
|
751 |
search_results = get_google_search_results(api_key, search_engine_id, google_search, sort_date,
|
752 |
this_search_string, page=page_num)
|
753 |
-
search_results = search_results[:5]
|
754 |
|
755 |
for result in search_results:
|
756 |
link = str(result["link"])
|
@@ -829,7 +844,7 @@ def generate_step2_reference_corpus(reference_file):
|
|
829 |
return tokenized_corpus, prompt_corpus
|
830 |
|
831 |
|
832 |
-
def decorate_with_questions(claim, retrieve_evidence, top_k=
|
833 |
#
|
834 |
reference_file = "averitec/data/train.json"
|
835 |
tokenized_corpus, prompt_corpus = generate_step2_reference_corpus(reference_file)
|
|
|
589 |
|
590 |
def get_google_search_results(api_key, search_engine_id, google_search, sort_date, search_string, page=0):
|
591 |
search_results = []
|
592 |
+
for i in range(1):
|
593 |
try:
|
594 |
search_results += google_search(
|
595 |
search_string,
|
596 |
api_key,
|
597 |
search_engine_id,
|
598 |
+
num=3, # num=10,
|
599 |
start=0 + 10 * page,
|
600 |
sort="date:r:19000101:" + sort_date,
|
601 |
dateRestrict=None,
|
|
|
603 |
)
|
604 |
break
|
605 |
except:
|
606 |
+
sleep(1)
|
607 |
+
|
608 |
+
# for i in range(3):
|
609 |
+
# try:
|
610 |
+
# search_results += google_search(
|
611 |
+
# search_string,
|
612 |
+
# api_key,
|
613 |
+
# search_engine_id,
|
614 |
+
# num=10,
|
615 |
+
# start=0 + 10 * page,
|
616 |
+
# sort="date:r:19000101:" + sort_date,
|
617 |
+
# dateRestrict=None,
|
618 |
+
# gl="US"
|
619 |
+
# )
|
620 |
+
# break
|
621 |
+
# except:
|
622 |
+
# sleep(3)
|
623 |
|
624 |
return search_results
|
625 |
|
|
|
766 |
for page_num in range(n_pages):
|
767 |
search_results = get_google_search_results(api_key, search_engine_id, google_search, sort_date,
|
768 |
this_search_string, page=page_num)
|
|
|
769 |
|
770 |
for result in search_results:
|
771 |
link = str(result["link"])
|
|
|
844 |
return tokenized_corpus, prompt_corpus
|
845 |
|
846 |
|
847 |
+
def decorate_with_questions(claim, retrieve_evidence, top_k=5): # top_k=10, 100
|
848 |
#
|
849 |
reference_file = "averitec/data/train.json"
|
850 |
tokenized_corpus, prompt_corpus = generate_step2_reference_corpus(reference_file)
|