bstraehle committed on
Commit
49dc208
·
verified ·
1 Parent(s): 8680017

Update utils/utils.py

Browse files
Files changed (1) hide show
  1. utils/utils.py +5 -7
utils/utils.py CHANGED
@@ -39,22 +39,20 @@ def get_dataset(dataset_type, level):
39
  dataset_repo = f"{username}/validation"
40
  dataset = load_dataset(dataset_repo, split="validation")
41
  df = dataset.to_pandas()
42
-
43
  if dataset_type == DATASET_TYPE_GAIA:
44
  print(f"filtering for dataset_type={dataset_type}")
45
- df = df[df["task_id"].str.startswith("gaia-")]
46
  elif dataset_type == DATASET_TYPE_HLE:
47
  print(f"filtering for dataset_type={dataset_type}")
48
- df = df[df["task_id"].str.startswith("hle-")]
49
 
50
- if level > 0:
51
- df = df[df["Level"] == level]
52
-
53
- print(df)
54
 
55
  result=[]
56
 
57
  for _, row in df.iterrows():
 
58
  result.append([row["Question"], row["Final answer"], row["file_name"]])
59
 
60
  return result
 
39
  dataset_repo = f"{username}/validation"
40
  dataset = load_dataset(dataset_repo, split="validation")
41
  df = dataset.to_pandas()
42
+
43
  if dataset_type == DATASET_TYPE_GAIA:
44
  print(f"filtering for dataset_type={dataset_type}")
45
+ df = df[df["Level"].isin([1, 2, 3])]
46
  elif dataset_type == DATASET_TYPE_HLE:
47
  print(f"filtering for dataset_type={dataset_type}")
48
+ df = df[df["Level"] == 0]
49
 
50
+ df = df[df["Level"] == level]
 
 
 
51
 
52
  result=[]
53
 
54
  for _, row in df.iterrows():
55
+ print(row)
56
  result.append([row["Question"], row["Final answer"], row["file_name"]])
57
 
58
  return result