Spaces:
Build error
Build error
zhenyundeng
committed on
Commit
·
0c31614
1
Parent(s):
99c6d37
update files
Browse files
app.py
CHANGED
|
@@ -589,13 +589,13 @@ def get_text_from_link(url_link):
|
|
| 589 |
|
| 590 |
def get_google_search_results(api_key, search_engine_id, google_search, sort_date, search_string, page=0):
|
| 591 |
search_results = []
|
| 592 |
-
for i in range(
|
| 593 |
try:
|
| 594 |
search_results += google_search(
|
| 595 |
search_string,
|
| 596 |
api_key,
|
| 597 |
search_engine_id,
|
| 598 |
-
num=10,
|
| 599 |
start=0 + 10 * page,
|
| 600 |
sort="date:r:19000101:" + sort_date,
|
| 601 |
dateRestrict=None,
|
|
@@ -603,7 +603,23 @@ def get_google_search_results(api_key, search_engine_id, google_search, sort_dat
|
|
| 603 |
)
|
| 604 |
break
|
| 605 |
except:
|
| 606 |
-
sleep(
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 607 |
|
| 608 |
return search_results
|
| 609 |
|
|
@@ -750,7 +766,6 @@ def averitec_search(claim, generate_question, speaker="they", check_date="2024-0
|
|
| 750 |
for page_num in range(n_pages):
|
| 751 |
search_results = get_google_search_results(api_key, search_engine_id, google_search, sort_date,
|
| 752 |
this_search_string, page=page_num)
|
| 753 |
-
search_results = search_results[:5]
|
| 754 |
|
| 755 |
for result in search_results:
|
| 756 |
link = str(result["link"])
|
|
@@ -829,7 +844,7 @@ def generate_step2_reference_corpus(reference_file):
|
|
| 829 |
return tokenized_corpus, prompt_corpus
|
| 830 |
|
| 831 |
|
| 832 |
-
def decorate_with_questions(claim, retrieve_evidence, top_k=
|
| 833 |
#
|
| 834 |
reference_file = "averitec/data/train.json"
|
| 835 |
tokenized_corpus, prompt_corpus = generate_step2_reference_corpus(reference_file)
|
|
|
|
| 589 |
|
| 590 |
def get_google_search_results(api_key, search_engine_id, google_search, sort_date, search_string, page=0):
|
| 591 |
search_results = []
|
| 592 |
+
for i in range(1):
|
| 593 |
try:
|
| 594 |
search_results += google_search(
|
| 595 |
search_string,
|
| 596 |
api_key,
|
| 597 |
search_engine_id,
|
| 598 |
+
num=3, # num=10,
|
| 599 |
start=0 + 10 * page,
|
| 600 |
sort="date:r:19000101:" + sort_date,
|
| 601 |
dateRestrict=None,
|
|
|
|
| 603 |
)
|
| 604 |
break
|
| 605 |
except:
|
| 606 |
+
sleep(1)
|
| 607 |
+
|
| 608 |
+
# for i in range(3):
|
| 609 |
+
# try:
|
| 610 |
+
# search_results += google_search(
|
| 611 |
+
# search_string,
|
| 612 |
+
# api_key,
|
| 613 |
+
# search_engine_id,
|
| 614 |
+
# num=10,
|
| 615 |
+
# start=0 + 10 * page,
|
| 616 |
+
# sort="date:r:19000101:" + sort_date,
|
| 617 |
+
# dateRestrict=None,
|
| 618 |
+
# gl="US"
|
| 619 |
+
# )
|
| 620 |
+
# break
|
| 621 |
+
# except:
|
| 622 |
+
# sleep(3)
|
| 623 |
|
| 624 |
return search_results
|
| 625 |
|
|
|
|
| 766 |
for page_num in range(n_pages):
|
| 767 |
search_results = get_google_search_results(api_key, search_engine_id, google_search, sort_date,
|
| 768 |
this_search_string, page=page_num)
|
|
|
|
| 769 |
|
| 770 |
for result in search_results:
|
| 771 |
link = str(result["link"])
|
|
|
|
| 844 |
return tokenized_corpus, prompt_corpus
|
| 845 |
|
| 846 |
|
| 847 |
+
def decorate_with_questions(claim, retrieve_evidence, top_k=5): # top_k=10, 100
|
| 848 |
#
|
| 849 |
reference_file = "averitec/data/train.json"
|
| 850 |
tokenized_corpus, prompt_corpus = generate_step2_reference_corpus(reference_file)
|