Update eval.py
Browse files
eval.py
CHANGED
|
@@ -40,9 +40,9 @@ def statistics(commonsense_statistic):
|
|
| 40 |
def eval_score(validation_or_test: str, file_path: str, TOKEN):
|
| 41 |
|
| 42 |
if validation_or_test == 'validation':
|
| 43 |
-
query_data_list = load_dataset('osunlp/
|
| 44 |
elif validation_or_test == 'test':
|
| 45 |
-
query_data_list = load_dataset('osunlp/
|
| 46 |
|
| 47 |
query_data_list = [x for x in query_data_list]
|
| 48 |
hardConstraint_statistic= {level:{day:[] for day in [3,5,7]} for level in ['easy','medium','hard']}
|
|
|
|
| 40 |
def eval_score(validation_or_test: str, file_path: str, TOKEN):
|
| 41 |
|
| 42 |
if validation_or_test == 'validation':
|
| 43 |
+
query_data_list = load_dataset('osunlp/TravelPlannerEval','validation',token=TOKEN)['validation']
|
| 44 |
elif validation_or_test == 'test':
|
| 45 |
+
query_data_list = load_dataset('osunlp/TravelPlannerEval','test',token=TOKEN)['test']
|
| 46 |
|
| 47 |
query_data_list = [x for x in query_data_list]
|
| 48 |
hardConstraint_statistic= {level:{day:[] for day in [3,5,7]} for level in ['easy','medium','hard']}
|